From 56a6c3514b82636811b69ae08a9a7952f6649c83 Mon Sep 17 00:00:00 2001 From: duskzhen Date: Thu, 5 Feb 2026 22:26:10 +0800 Subject: [PATCH 1/4] Merge pull request #1302 from ThinkInAIXYZ/bugfix/question-end-error fix(agent): mark question tool messages sent --- src/main/presenter/agentPresenter/index.ts | 3 +++ .../presenter/agentPresenter/streaming/llmEventHandler.ts | 4 ++++ .../presenter/sessionPresenter/managers/messageManager.ts | 8 ++++++++ 3 files changed, 15 insertions(+) diff --git a/src/main/presenter/agentPresenter/index.ts b/src/main/presenter/agentPresenter/index.ts index ee403f94f..2833dc5ad 100644 --- a/src/main/presenter/agentPresenter/index.ts +++ b/src/main/presenter/agentPresenter/index.ts @@ -400,6 +400,9 @@ export class AgentPresenter implements IAgentPresenter { } await this.messageManager.editMessage(messageId, JSON.stringify(content)) + if (message.status === 'pending') { + await this.messageManager.updateMessageStatus(messageId, 'sent') + } presenter.sessionManager.clearPendingQuestion(message.conversationId) presenter.sessionManager.setStatus(message.conversationId, 'idle') } diff --git a/src/main/presenter/agentPresenter/streaming/llmEventHandler.ts b/src/main/presenter/agentPresenter/streaming/llmEventHandler.ts index 9709ca895..9eb76ded9 100644 --- a/src/main/presenter/agentPresenter/streaming/llmEventHandler.ts +++ b/src/main/presenter/agentPresenter/streaming/llmEventHandler.ts @@ -399,6 +399,10 @@ export class LLMEventHandler { {}, state.message.content ) + if (hasPendingQuestions) { + // Question tool ends the assistant message even when waiting for user input. + await this.messageManager.updateMessageStatus(eventId, 'sent') + } this.searchingMessages.delete(eventId) presenter.sessionManager.setStatus(state.conversationId, 'waiting_permission') if (!hasPendingPermissions) { diff --git a/src/main/presenter/sessionPresenter/managers/messageManager.ts b/src/main/presenter/sessionPresenter/managers/messageManager.ts index c1b5001c2..30c917aed 100644 --- a/src/main/presenter/sessionPresenter/managers/messageManager.ts +++ b/src/main/presenter/sessionPresenter/managers/messageManager.ts @@ -384,6 +384,14 @@ export class MessageManager implements IMessageManager { // 处理每个未完成的消息 for (const message of pendingMessages) { + const blocks = Array.isArray(message.content) ? message.content : [] + const hasQuestionRequest = blocks.some( + (block) => block.type === 'action' && block.action_type === 'question_request' + ) + if (hasQuestionRequest) { + await this.updateMessageStatus(message.id, 'sent') + continue + } await this.handleMessageError(message.id, 'common.error.sessionInterrupted') } } From 7a73428cfecddd4778597e1eec9c291f61310faa Mon Sep 17 00:00:00 2001 From: yyhhyyyyyy Date: Mon, 9 Feb 2026 15:57:31 +0800 Subject: [PATCH 2/4] refactor: route openai to responses (#1303) * refactor: route openai to responses * fix(i18n): localize openaiResponsesNotice --- resources/model-db/providers.json | 97844 +++++++++------- src/main/presenter/configPresenter/index.ts | 28 + .../presenter/configPresenter/providers.ts | 26 +- .../managers/providerInstanceManager.ts | 6 +- .../components/AddCustomProviderDialog.vue | 19 +- .../settings/components/ProviderApiConfig.vue | 12 + .../components/settings/ModelConfigDialog.vue | 24 +- src/renderer/src/i18n/da-DK/settings.json | 1 + src/renderer/src/i18n/en-US/settings.json | 1 + src/renderer/src/i18n/fa-IR/settings.json | 1 + src/renderer/src/i18n/fr-FR/settings.json | 1 + src/renderer/src/i18n/he-IL/settings.json | 1 + src/renderer/src/i18n/ja-JP/settings.json | 1 + src/renderer/src/i18n/ko-KR/settings.json | 1 + src/renderer/src/i18n/pt-BR/settings.json | 1 + src/renderer/src/i18n/ru-RU/settings.json | 1 + src/renderer/src/i18n/zh-CN/settings.json | 1 + src/renderer/src/i18n/zh-HK/settings.json | 1 + src/renderer/src/i18n/zh-TW/settings.json | 1 + 19 files changed, 54121 insertions(+), 43850 deletions(-) diff --git a/resources/model-db/providers.json b/resources/model-db/providers.json index 4552b1fec..08c353c85 100644 --- a/resources/model-db/providers.json +++ b/resources/model-db/providers.json @@ -1,50 +1,47 @@ { "providers": { - "moonshot": { - "id": "moonshot", - "name": "Moonshot AI (China)", - "display_name": "Moonshot AI (China)", - "api": "https://api.moonshot.cn/v1", - "doc": "https://platform.moonshot.cn/docs/api/chat", + "privatemode-ai": { + "id": "privatemode-ai", + "name": "Privatemode AI", + "display_name": "Privatemode AI", + "api": "http://localhost:8080/v1", + "doc": "https://docs.privatemode.ai/api/overview", "models": [ { - "id": "kimi-k2-thinking-turbo", - "name": "Kimi K2 Thinking Turbo", - "display_name": "Kimi K2 Thinking Turbo", + "id": "whisper-large-v3", + "name": "Whisper large-v3", + "display_name": "Whisper large-v3", "modalities": { "input": [ - "text" + "audio" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 0, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-11-06", - "last_updated": "2025-11-06", + "knowledge": "2023-09", + "release_date": "2023-09-01", + "last_updated": "2023-09-01", "cost": { - "input": 1.15, - "output": 8, - "cache_read": 0.15 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "kimi-k2-thinking", - "name": "Kimi K2 Thinking", - "display_name": "Kimi K2 Thinking", + "id": "qwen3-embedding-4b", + "name": "Qwen3-Embedding 4B", + "display_name": "Qwen3-Embedding 4B", "modalities": { "input": [ "text" @@ -54,31 +51,28 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 32000, + "output": 2560 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-11-06", - "last_updated": "2025-11-06", + "knowledge": "2025-06", + "release_date": "2025-06-06", + "last_updated": "2025-06-06", "cost": { - "input": 0.6, - "output": 2.5, - "cache_read": 0.15 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "kimi-k2-0905-preview", - "name": "Kimi K2 0905", - "display_name": "Kimi K2 0905", + "id": "gpt-oss-120b", + "name": "gpt-oss-120b", + "display_name": "gpt-oss-120b", "modalities": { "input": [ "text" @@ -88,63 +82,61 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-09-05", - "last_updated": "2025-09-05", + "knowledge": "2025-08", + "release_date": "2025-08-04", + "last_updated": "2025-08-14", "cost": { - "input": 0.6, - "output": 2.5, - "cache_read": 0.15 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "kimi-k2-0711-preview", - "name": "Kimi K2 0711", - "display_name": "Kimi K2 0711", + "id": "gemma-3-27b", + "name": "Gemma 3 27B", + "display_name": "Gemma 3 27B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-07-14", - "last_updated": "2025-07-14", + "knowledge": "2024-08", + "release_date": "2025-03-12", + "last_updated": "2025-03-12", "cost": { - "input": 0.6, - "output": 2.5, - "cache_read": 0.15 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "kimi-k2-turbo-preview", - "name": "Kimi K2 Turbo", - "display_name": "Kimi K2 Turbo", + "id": "qwen3-coder-30b-a3b", + "name": "Qwen3-Coder 30B-A3B", + "display_name": "Qwen3-Coder 30B-A3B", "modalities": { "input": [ "text" @@ -154,8 +146,8 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -164,29 +156,27 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-09-05", - "last_updated": "2025-09-05", + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "cost": { - "input": 2.4, - "output": 10, - "cache_read": 0.6 - }, - "type": "chat" + "input": 0, + "output": 0 + } } ] }, - "lucidquery": { - "id": "lucidquery", - "name": "LucidQuery AI", - "display_name": "LucidQuery AI", - "api": "https://lucidquery.com/api/v1", - "doc": "https://lucidquery.com/api/docs", + "moonshot": { + "id": "moonshot", + "name": "Moonshot AI (China)", + "display_name": "Moonshot AI (China)", + "api": "https://api.moonshot.cn/v1", + "doc": "https://platform.moonshot.cn/docs/api/chat", "models": [ { - "id": "lucidquery-nexus-coder", - "name": "LucidQuery Nexus Coder", - "display_name": "LucidQuery Nexus Coder", + "id": "kimi-k2-0905-preview", + "name": "Kimi K2 0905", + "display_name": "Kimi K2 0905", "modalities": { "input": [ "text" @@ -196,72 +186,29 @@ ] }, "limit": { - "context": 250000, - "output": 60000 + "context": 262144, + "output": 262144 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-01", - "release_date": "2025-09-01", - "last_updated": "2025-09-01", + "attachment": false, + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", "cost": { - "input": 2, - "output": 5 - }, - "type": "chat" + "input": 0.6, + "output": 2.5, + "cache_read": 0.15 + } }, { - "id": "lucidnova-rf1-100b", - "name": "LucidNova RF1 100B", - "display_name": "LucidNova RF1 100B", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 120000, - "output": 8000 - }, - "temperature": false, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-09-16", - "release_date": "2024-12-28", - "last_updated": "2025-09-10", - "cost": { - "input": 2, - "output": 5 - }, - "type": "chat" - } - ] - }, - "moonshot-ai": { - "id": "moonshot-ai", - "name": "Moonshot AI", - "display_name": "Moonshot AI", - "api": "https://api.moonshot.ai/v1", - "doc": "https://platform.moonshot.ai/docs/api/chat", - "models": [ - { - "id": "kimi-k2-thinking-turbo", - "name": "Kimi K2 Thinking Turbo", - "display_name": "Kimi K2 Thinking Turbo", + "id": "kimi-k2-thinking", + "name": "Kimi K2 Thinking", + "display_name": "Kimi K2 Thinking", "modalities": { "input": [ "text" @@ -286,16 +233,15 @@ "release_date": "2025-11-06", "last_updated": "2025-11-06", "cost": { - "input": 1.15, - "output": 8, + "input": 0.6, + "output": 2.5, "cache_read": 0.15 - }, - "type": "chat" + } }, { - "id": "kimi-k2-turbo-preview", - "name": "Kimi K2 Turbo", - "display_name": "Kimi K2 Turbo", + "id": "kimi-k2-0711-preview", + "name": "Kimi K2 0711", + "display_name": "Kimi K2 0711", "modalities": { "input": [ "text" @@ -305,8 +251,8 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 131072, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -316,52 +262,53 @@ "attachment": false, "open_weights": true, "knowledge": "2024-10", - "release_date": "2025-09-05", - "last_updated": "2025-09-05", + "release_date": "2025-07-14", + "last_updated": "2025-07-14", "cost": { - "input": 2.4, - "output": 10, - "cache_read": 0.6 - }, - "type": "chat" + "input": 0.6, + "output": 2.5, + "cache_read": 0.15 + } }, { - "id": "kimi-k2-0711-preview", - "name": "Kimi K2 0711", - "display_name": "Kimi K2 0711", + "id": "kimi-k2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 262144, + "output": 262144 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-07-14", - "last_updated": "2025-07-14", + "knowledge": "2025-01", + "release_date": "2026-01", + "last_updated": "2026-01", "cost": { "input": 0.6, - "output": 2.5, - "cache_read": 0.15 - }, - "type": "chat" + "output": 3, + "cache_read": 0.1 + } }, { - "id": "kimi-k2-thinking", - "name": "Kimi K2 Thinking", - "display_name": "Kimi K2 Thinking", + "id": "kimi-k2-turbo-preview", + "name": "Kimi K2 Turbo", + "display_name": "Kimi K2 Turbo", "modalities": { "input": [ "text" @@ -377,25 +324,23 @@ "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-11-06", - "last_updated": "2025-11-06", + "knowledge": "2024-10", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", "cost": { - "input": 0.6, - "output": 2.5, - "cache_read": 0.15 - }, - "type": "chat" + "input": 2.4, + "output": 10, + "cache_read": 0.6 + } }, { - "id": "kimi-k2-0905-preview", - "name": "Kimi K2 0905", - "display_name": "Kimi K2 0905", + "id": "kimi-k2-thinking-turbo", + "name": "Kimi K2 Thinking Turbo", + "display_name": "Kimi K2 Thinking Turbo", "modalities": { "input": [ "text" @@ -411,79 +356,77 @@ "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-09-05", - "last_updated": "2025-09-05", + "knowledge": "2024-08", + "release_date": "2025-11-06", + "last_updated": "2025-11-06", "cost": { - "input": 0.6, - "output": 2.5, + "input": 1.15, + "output": 8, "cache_read": 0.15 - }, - "type": "chat" + } } ] }, - "zai-coding-plan": { - "id": "zai-coding-plan", - "name": "Z.AI Coding Plan", - "display_name": "Z.AI Coding Plan", - "api": "https://api.z.ai/api/coding/paas/v4", - "doc": "https://docs.z.ai/devpack/overview", + "firmware": { + "id": "firmware", + "name": "Firmware", + "display_name": "Firmware", + "api": "https://app.firmware.ai/api/v1", + "doc": "https://docs.firmware.ai", "models": [ { - "id": "glm-4.7", - "name": "GLM-4.7", - "display_name": "GLM-4.7", + "id": "grok-4-fast-non-reasoning", + "name": "Grok 4 Fast (Non-Reasoning)", + "display_name": "Grok 4 Fast (Non-Reasoning)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 2000000, + "output": 30000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-22", - "last_updated": "2025-12-22", + "attachment": true, + "open_weights": false, + "knowledge": "2025-07", + "release_date": "2025-09-19", + "last_updated": "2025-09-19", "cost": { "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 - }, - "type": "chat" + "output": 0 + } }, { - "id": "glm-4.5-flash", - "name": "GLM-4.5-Flash", - "display_name": "GLM-4.5-Flash", + "id": "grok-4-fast-reasoning", + "name": "Grok 4 Fast (Reasoning)", + "display_name": "Grok 4 Fast (Reasoning)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 98304 + "context": 2000000, + "output": 30000 }, "temperature": true, "tool_call": true, @@ -491,34 +434,35 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "attachment": true, + "open_weights": false, + "knowledge": "2025-07", + "release_date": "2025-09-19", + "last_updated": "2025-09-19", "cost": { "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 - }, - "type": "chat" + "output": 0 + } }, { - "id": "glm-4.5", - "name": "GLM-4.5", - "display_name": "GLM-4.5", + "id": "gemini-3-flash-preview", + "name": "Gemini 3 Flash Preview", + "display_name": "Gemini 3 Flash Preview", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 98304 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -526,23 +470,20 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", "cost": { "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 - }, - "type": "chat" + "output": 0 + } }, { - "id": "glm-4.5-air", - "name": "GLM-4.5-Air", - "display_name": "GLM-4.5-Air", + "id": "grok-code-fast-1", + "name": "Grok Code Fast 1", + "display_name": "Grok Code Fast 1", "modalities": { "input": [ "text" @@ -552,8 +493,8 @@ ] }, "limit": { - "context": 131072, - "output": 98304 + "context": 256000, + "output": 10000 }, "temperature": true, "tool_call": true, @@ -562,35 +503,32 @@ "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "open_weights": false, + "knowledge": "2023-10", + "release_date": "2025-08-28", + "last_updated": "2025-08-28", "cost": { "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 - }, - "type": "chat" + "output": 0 + } }, { - "id": "glm-4.5v", - "name": "GLM-4.5V", - "display_name": "GLM-4.5V", + "id": "claude-haiku-4-5", + "name": "Claude Haiku 4.5", + "display_name": "Claude Haiku 4.5", "modalities": { "input": [ "text", "image", - "video" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 64000, - "output": 16384 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -599,20 +537,19 @@ "default": true }, "attachment": true, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-08-11", - "last_updated": "2025-08-11", + "open_weights": false, + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "cost": { "input": 0, "output": 0 - }, - "type": "chat" + } }, { - "id": "glm-4.6", - "name": "GLM-4.6", - "display_name": "GLM-4.6", + "id": "kimi-k2-thinking-turbo", + "name": "Kimi K2 Thinking Turbo", + "display_name": "Kimi K2 Thinking Turbo", "modalities": { "input": [ "text" @@ -622,8 +559,8 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 262000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -632,36 +569,32 @@ "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-09-30", - "last_updated": "2025-09-30", + "open_weights": false, + "release_date": "1970-01-01", + "last_updated": "1970-01-01", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 - }, - "type": "chat" + "input": 1.15, + "output": 8 + } }, { - "id": "glm-4.6v", - "name": "GLM-4.6V", - "display_name": "GLM-4.6V", + "id": "claude-opus-4-6", + "name": "Claude Opus 4.6", + "display_name": "Claude Opus 4.6", "modalities": { "input": [ "text", "image", - "video" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 - }, + "context": 200000, + "output": 128000 + }, "temperature": true, "tool_call": true, "reasoning": { @@ -669,40 +602,32 @@ "default": true }, "attachment": true, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-08", - "last_updated": "2025-12-08", + "open_weights": false, + "knowledge": "2025-05-31", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", "cost": { "input": 0, "output": 0 - }, - "type": "chat" - } - ] - }, - "xiaomi": { - "id": "xiaomi", - "name": "Xiaomi", - "display_name": "Xiaomi", - "api": "https://api.xiaomimimo.com/v1", - "doc": "https://platform.xiaomimimo.com/#/docs", - "models": [ + } + }, { - "id": "mimo-v2-flash", - "name": "MiMo-V2-Flash", - "display_name": "MiMo-V2-Flash", + "id": "claude-opus-4-5", + "name": "Claude Opus 4.5", + "display_name": "Claude Opus 4.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 32000 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -710,171 +635,188 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-12-01", - "release_date": "2025-12-17", - "last_updated": "2025-12-17", + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-11-24", + "last_updated": "2025-11-24", "cost": { - "input": 0.07, - "output": 0.21 - }, - "type": "chat" - } - ] - }, - "alibaba": { - "id": "alibaba", - "name": "alibaba", - "display_name": "alibaba", - "api": "https://dashscope-intl.aliyuncs.com/compatible-mode/v1", - "doc": "https://www.alibabacloud.com/help/en/model-studio/models", - "models": [ + "input": 0, + "output": 0 + } + }, { - "id": "qwen3-livetranslate-flash-realtime", - "name": "Qwen3-LiveTranslate Flash Realtime", - "display_name": "Qwen3-LiveTranslate Flash Realtime", + "id": "deepseek-chat", + "name": "DeepSeek Chat", + "display_name": "DeepSeek Chat", "modalities": { "input": [ - "text", - "image", - "audio", - "video" + "text" ], "output": [ - "text", - "audio" + "text" ] }, "limit": { - "context": 53248, - "output": 4096 + "context": 128000, + "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-09-22", - "last_updated": "2025-09-22", + "knowledge": "2024-07", + "release_date": "2024-12-26", + "last_updated": "2025-09-29", "cost": { - "input": 10, - "output": 10, - "input_audio": 10, - "output_audio": 38 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "qwen3-asr-flash", - "name": "Qwen3-ASR Flash", - "display_name": "Qwen3-ASR Flash", + "id": "gemini-3-pro-preview", + "name": "Gemini 3 Pro Preview", + "display_name": "Gemini 3 Pro Preview", "modalities": { "input": [ - "audio" + "text", + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 53248, - "output": 4096 + "context": 1000000, + "output": 64000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-09-08", - "last_updated": "2025-09-08", + "knowledge": "2025-01", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", "cost": { - "input": 0.035, - "output": 0.035 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "qwen-omni-turbo", - "name": "Qwen-Omni Turbo", - "display_name": "Qwen-Omni Turbo", + "id": "gemini-2.5-flash", + "name": "Gemini 2.5 Flash", + "display_name": "Gemini 2.5 Flash", "modalities": { "input": [ "text", "image", "audio", - "video" + "video", + "pdf" ], "output": [ - "text", - "audio" + "text" ] }, "limit": { - "context": 32768, - "output": 2048 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-01-19", - "last_updated": "2025-03-26", + "knowledge": "2025-01", + "release_date": "2025-07-17", + "last_updated": "2025-07-17", "cost": { - "input": 0.07, - "output": 0.27, - "input_audio": 4.44, - "output_audio": 8.89 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "qwen-vl-max", - "name": "Qwen-VL Max", - "display_name": "Qwen-VL Max", + "id": "kimi-k2.5", + "name": "Kimi-K2.5", + "display_name": "Kimi-K2.5", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 262000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-04-08", - "last_updated": "2025-08-13", + "release_date": "1970-01-01", + "last_updated": "1970-01-01", "cost": { - "input": 0.8, - "output": 3.2 + "input": 0.1, + "output": 3 + } + }, + { + "id": "claude-sonnet-4-5", + "name": "Claude Sonnet 4.5", + "display_name": "Claude Sonnet 4.5", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] }, - "type": "chat" + "limit": { + "context": 200000, + "output": 64000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", + "cost": { + "input": 0, + "output": 0 + } }, { - "id": "qwen3-next-80b-a3b-instruct", - "name": "Qwen3 Next 80B A3B Instruct", - "display_name": "Qwen3 Next 80B A3B Instruct", + "id": "zai-glm-4.7", + "name": "Z.AI GLM-4.7", + "display_name": "Z.AI GLM-4.7", "modalities": { "input": [ "text" @@ -885,7 +827,7 @@ }, "limit": { "context": 131072, - "output": 32768 + "output": 40000 }, "temperature": true, "tool_call": true, @@ -894,19 +836,17 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-09", - "last_updated": "2025-09", + "release_date": "1970-01-01", + "last_updated": "1970-01-01", "cost": { - "input": 0.5, - "output": 2 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "qwen-turbo", - "name": "Qwen Turbo", - "display_name": "Qwen Turbo", + "id": "kimi-k2-thinking", + "name": "Kimi K2 Thinking", + "display_name": "Kimi K2 Thinking", "modalities": { "input": [ "text" @@ -916,42 +856,28 @@ ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 262000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false, - "budget": { - "default": 38912, - "min": 0, - "max": 38912 - } - }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" + "default": true }, "attachment": false, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-11-01", - "last_updated": "2025-04-28", + "release_date": "1970-01-01", + "last_updated": "1970-01-01", "cost": { - "input": 0.05, - "output": 0.2, - "reasoning": 0.5 - }, - "type": "chat" + "input": 0.6, + "output": 2.5 + } }, { - "id": "qwen3-vl-235b-a22b", - "name": "Qwen3-VL 235B-A22B", - "display_name": "Qwen3-VL 235B-A22B", + "id": "gpt-5-nano", + "name": "GPT-5 Nano", + "display_name": "GPT-5 Nano", "modalities": { "input": [ "text", @@ -962,63 +888,62 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2025-04", + "attachment": true, + "open_weights": false, + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.7, - "output": 2.8, - "reasoning": 8.4 - }, - "type": "chat" + "input": 0, + "output": 0, + "cache_read": 0 + } }, { - "id": "qwen3-coder-flash", - "name": "Qwen3 Coder Flash", - "display_name": "Qwen3 Coder Flash", + "id": "gpt-4o", + "name": "GPT-4o", + "display_name": "GPT-4o", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "knowledge": "2023-09", + "release_date": "2024-05-13", + "last_updated": "2024-08-06", "cost": { - "input": 0.3, - "output": 1.5 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "qwen3-vl-30b-a3b", - "name": "Qwen3-VL 30B-A3B", - "display_name": "Qwen3-VL 30B-A3B", + "id": "gpt-5-mini", + "name": "GPT-5 Mini", + "display_name": "GPT-5 Mini", "modalities": { "input": [ "text", @@ -1029,31 +954,30 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2025-04", + "attachment": true, + "open_weights": false, + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.2, - "output": 0.8, - "reasoning": 2.4 - }, - "type": "chat" + "input": 0, + "output": 0, + "cache_read": 0 + } }, { - "id": "qwen3-14b", - "name": "Qwen3 14B", - "display_name": "Qwen3 14B", + "id": "deepseek-reasoner", + "name": "DeepSeek Reasoner", + "display_name": "DeepSeek Reasoner", "modalities": { "input": [ "text" @@ -1063,48 +987,44 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true, - "budget": { - "default": 38912, - "min": 0, - "max": 38912 - } + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2025-04", + "attachment": true, + "open_weights": false, + "knowledge": "2024-07", + "release_date": "2025-01-20", + "last_updated": "2025-09-29", "cost": { - "input": 0.35, - "output": 1.4, - "reasoning": 4.2 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "qvq-max", - "name": "QVQ Max", - "display_name": "QVQ Max", + "id": "gemini-2.5-pro", + "name": "Gemini 2.5 Pro", + "display_name": "Gemini 2.5 Pro", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -1112,21 +1032,20 @@ "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-03-25", - "last_updated": "2025-03-25", + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-06-05", "cost": { - "input": 1.2, - "output": 4.8 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "qwen-plus-character-ja", - "name": "Qwen Plus Character (Japanese)", - "display_name": "Qwen Plus Character (Japanese)", + "id": "gpt-oss-120b", + "name": "GPT OSS 120B", + "display_name": "GPT OSS 120B", "modalities": { "input": [ "text" @@ -1136,170 +1055,182 @@ ] }, "limit": { - "context": 8192, - "output": 512 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-01", - "last_updated": "2024-01", + "open_weights": true, + "release_date": "1970-01-01", + "last_updated": "1970-01-01", "cost": { - "input": 0.5, - "output": 1.4 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "qwen2-5-14b-instruct", - "name": "Qwen2.5 14B Instruct", - "display_name": "Qwen2.5 14B Instruct", + "id": "gpt-5", + "name": "GPT-5", + "display_name": "GPT-5", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-04", - "release_date": "2024-09", - "last_updated": "2024-09", + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.35, - "output": 1.4 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "qwq-plus", - "name": "QwQ Plus", - "display_name": "QwQ Plus", + "id": "gpt-5.2", + "name": "GPT-5.2", + "display_name": "GPT-5.2", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 400000, + "output": 128000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { "supported": true, - "default": true, - "budget": { - "default": 32768, - "min": 0, - "max": 32768 - } - }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-03-05", - "last_updated": "2025-03-05", + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 0.8, - "output": 2.4 - }, - "type": "chat" - }, + "input": 0, + "output": 0 + } + } + ] + }, + "nova": { + "id": "nova", + "name": "Nova", + "display_name": "Nova", + "api": "https://api.nova.amazon.com/v1", + "doc": "https://nova.amazon.com/dev/documentation", + "models": [ { - "id": "qwen3-coder-30b-a3b-instruct", - "name": "Qwen3-Coder 30B-A3B Instruct", - "display_name": "Qwen3-Coder 30B-A3B Instruct", + "id": "nova-2-lite-v1", + "name": "Nova 2 Lite", + "display_name": "Nova 2 Lite", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 1000000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2025-04", + "attachment": true, + "open_weights": false, + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "cost": { - "input": 0.45, - "output": 2.25 - }, - "type": "chat" + "input": 0, + "output": 0, + "reasoning": 0 + } }, { - "id": "qwen-vl-ocr", - "name": "Qwen Vl Ocr", - "display_name": "Qwen Vl Ocr", + "id": "nova-2-pro-v1", + "name": "Nova 2 Pro", + "display_name": "Nova 2 Pro", "modalities": { "input": [ "text", - "image" + "image", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 34096, - "output": 4096 + "context": 1000000, + "output": 64000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-10-28", - "last_updated": "2025-04-13", + "release_date": "2026-12-03", + "last_updated": "2026-01-03", "cost": { - "input": 0.72, - "output": 0.72 - }, - "type": "chat" - }, + "input": 0, + "output": 0, + "reasoning": 0 + } + } + ] + }, + "lucidquery": { + "id": "lucidquery", + "name": "LucidQuery AI", + "display_name": "LucidQuery AI", + "api": "https://lucidquery.com/api/v1", + "doc": "https://lucidquery.com/api/docs", + "models": [ { - "id": "qwen2-5-72b-instruct", - "name": "Qwen2.5 72B Instruct", - "display_name": "Qwen2.5 72B Instruct", + "id": "lucidquery-nexus-coder", + "name": "LucidQuery Nexus Coder", + "display_name": "LucidQuery Nexus Coder", "modalities": { "input": [ "text" @@ -1309,68 +1240,70 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 250000, + "output": 60000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-04", - "release_date": "2024-09", - "last_updated": "2024-09", + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-01", + "release_date": "2025-09-01", + "last_updated": "2025-09-01", "cost": { - "input": 1.4, - "output": 5.6 - }, - "type": "chat" + "input": 2, + "output": 5 + } }, { - "id": "qwen3-omni-flash", - "name": "Qwen3-Omni Flash", - "display_name": "Qwen3-Omni Flash", + "id": "lucidnova-rf1-100b", + "name": "LucidNova RF1 100B", + "display_name": "LucidNova RF1 100B", "modalities": { "input": [ - "text", - "image", - "audio", - "video" + "text" ], "output": [ - "text", - "audio" + "text" ] }, "limit": { - "context": 65536, - "output": 16384 + "context": 120000, + "output": 8000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-09-15", - "last_updated": "2025-09-15", + "knowledge": "2025-09-16", + "release_date": "2024-12-28", + "last_updated": "2025-09-10", "cost": { - "input": 0.43, - "output": 1.66, - "input_audio": 3.81, - "output_audio": 15.11 - }, - "type": "chat" - }, + "input": 2, + "output": 5 + } + } + ] + }, + "moonshot-ai": { + "id": "moonshot-ai", + "name": "Moonshot AI", + "display_name": "Moonshot AI", + "api": "https://api.moonshot.ai/v1", + "doc": "https://platform.moonshot.ai/docs/api/chat", + "models": [ { - "id": "qwen-flash", - "name": "Qwen Flash", - "display_name": "Qwen Flash", + "id": "kimi-k2-thinking-turbo", + "name": "Kimi K2 Thinking Turbo", + "display_name": "Kimi K2 Thinking Turbo", "modalities": { "input": [ "text" @@ -1380,41 +1313,30 @@ ] }, "limit": { - "context": 1000000, - "output": 32768 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } - }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" + "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "open_weights": true, + "knowledge": "2024-08", + "release_date": "2025-11-06", + "last_updated": "2025-11-06", "cost": { - "input": 0.05, - "output": 0.4 - }, - "type": "chat" + "input": 1.15, + "output": 8, + "cache_read": 0.15 + } }, { - "id": "qwen3-8b", - "name": "Qwen3 8B", - "display_name": "Qwen3 8B", + "id": "kimi-k2-turbo-preview", + "name": "Kimi K2 Turbo", + "display_name": "Kimi K2 Turbo", "modalities": { "input": [ "text" @@ -1424,78 +1346,67 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true, - "budget": { - "default": 38912, - "min": 0, - "max": 38912 - } + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2025-04", + "knowledge": "2024-10", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", "cost": { - "input": 0.18, - "output": 0.7, - "reasoning": 2.1 - }, - "type": "chat" + "input": 2.4, + "output": 10, + "cache_read": 0.6 + } }, { - "id": "qwen3-omni-flash-realtime", - "name": "Qwen3-Omni Flash Realtime", - "display_name": "Qwen3-Omni Flash Realtime", + "id": "kimi-k2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ "text", "image", - "audio", "video" ], "output": [ - "text", - "audio" + "text" ] }, "limit": { - "context": 65536, - "output": 16384 + "context": 262144, + "output": 262144 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-09-15", - "last_updated": "2025-09-15", + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-01", + "last_updated": "2026-01", "cost": { - "input": 0.52, - "output": 1.99, - "input_audio": 4.57, - "output_audio": 18.13 - }, - "type": "chat" + "input": 0.6, + "output": 3, + "cache_read": 0.1 + } }, { - "id": "qwen2-5-vl-72b-instruct", - "name": "Qwen2.5-VL 72B Instruct", - "display_name": "Qwen2.5-VL 72B Instruct", + "id": "kimi-k2-0711-preview", + "name": "Kimi K2 0711", + "display_name": "Kimi K2 0711", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -1503,7 +1414,7 @@ }, "limit": { "context": 131072, - "output": 8192 + "output": 16384 }, "temperature": true, "tool_call": true, @@ -1512,23 +1423,22 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-04", - "release_date": "2024-09", - "last_updated": "2024-09", + "knowledge": "2024-10", + "release_date": "2025-07-14", + "last_updated": "2025-07-14", "cost": { - "input": 2.8, - "output": 8.4 - }, - "type": "chat" + "input": 0.6, + "output": 2.5, + "cache_read": 0.15 + } }, { - "id": "qwen3-vl-plus", - "name": "Qwen3 VL Plus", - "display_name": "Qwen3 VL Plus", + "id": "kimi-k2-thinking", + "name": "Kimi K2 Thinking", + "display_name": "Kimi K2 Thinking", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -1536,35 +1446,29 @@ }, "limit": { "context": 262144, - "output": 32768 + "output": 262144 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, - "default": false, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } + "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-09-23", - "last_updated": "2025-09-23", + "open_weights": true, + "knowledge": "2024-08", + "release_date": "2025-11-06", + "last_updated": "2025-11-06", "cost": { - "input": 0.2, - "output": 1.6, - "reasoning": 4.8 - }, - "type": "chat" + "input": 0.6, + "output": 2.5, + "cache_read": 0.15 + } }, { - "id": "qwen-plus", - "name": "Qwen Plus", - "display_name": "Qwen Plus", + "id": "kimi-k2-0905-preview", + "name": "Kimi K2 0905", + "display_name": "Kimi K2 0905", "modalities": { "input": [ "text" @@ -1574,111 +1478,101 @@ ] }, "limit": { - "context": 1000000, - "output": 32768 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } - }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" + "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-01-25", - "last_updated": "2025-09-11", + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", "cost": { - "input": 0.4, - "output": 1.2, - "reasoning": 4 - }, - "type": "chat" - }, + "input": 0.6, + "output": 2.5, + "cache_read": 0.15 + } + } + ] + }, + "302ai": { + "id": "302ai", + "name": "302.AI", + "display_name": "302.AI", + "api": "https://api.302.ai/v1", + "doc": "https://doc.302.ai", + "models": [ { - "id": "qwen2-5-32b-instruct", - "name": "Qwen2.5 32B Instruct", - "display_name": "Qwen2.5 32B Instruct", + "id": "gpt-4.1-nano", + "name": "gpt-4.1-nano", + "display_name": "gpt-4.1-nano", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1000000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, + "attachment": true, + "open_weights": false, "knowledge": "2024-04", - "release_date": "2024-09", - "last_updated": "2024-09", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.7, - "output": 2.8 - }, - "type": "chat" + "input": 0.1, + "output": 0.4 + } }, { - "id": "qwen2-5-omni-7b", - "name": "Qwen2.5-Omni 7B", - "display_name": "Qwen2.5-Omni 7B", + "id": "doubao-seed-code-preview-251028", + "name": "doubao-seed-code-preview-251028", + "display_name": "doubao-seed-code-preview-251028", "modalities": { "input": [ "text", - "image", - "audio", - "video" + "image" ], "output": [ - "text", - "audio" + "text" ] }, "limit": { - "context": 32768, - "output": 2048 + "context": 256000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-04", - "release_date": "2024-12", - "last_updated": "2024-12", + "attachment": true, + "open_weights": false, + "release_date": "2025-11-11", + "last_updated": "2025-11-11", "cost": { - "input": 0.1, - "output": 0.4, - "input_audio": 6.76 - }, - "type": "chat" + "input": 0.17, + "output": 1.14 + } }, { - "id": "qwen-max", - "name": "Qwen Max", - "display_name": "Qwen Max", + "id": "glm-4.7", + "name": "glm-4.7", + "display_name": "glm-4.7", "modalities": { "input": [ "text" @@ -1688,79 +1582,71 @@ ] }, "limit": { - "context": 32768, - "output": 8192 + "context": 200000, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" - }, "attachment": false, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-04-03", - "last_updated": "2025-01-25", + "knowledge": "2025-06", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "cost": { - "input": 1.6, - "output": 6.4 - }, - "type": "chat" + "input": 0.286, + "output": 1.142 + } }, { - "id": "qwen2-5-7b-instruct", - "name": "Qwen2.5 7B Instruct", - "display_name": "Qwen2.5 7B Instruct", + "id": "grok-4-fast-non-reasoning", + "name": "grok-4-fast-non-reasoning", + "display_name": "grok-4-fast-non-reasoning", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 2000000, + "output": 30000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-04", - "release_date": "2024-09", - "last_updated": "2024-09", + "attachment": true, + "open_weights": false, + "knowledge": "2025-06", + "release_date": "2025-09-23", + "last_updated": "2025-09-23", "cost": { - "input": 0.175, - "output": 0.7 - }, - "type": "chat" - }, + "input": 0.2, + "output": 0.5 + } + }, { - "id": "qwen2-5-vl-7b-instruct", - "name": "Qwen2.5-VL 7B Instruct", - "display_name": "Qwen2.5-VL 7B Instruct", + "id": "qwen3-235b-a22b-instruct-2507", + "name": "qwen3-235b-a22b-instruct-2507", + "display_name": "qwen3-235b-a22b-instruct-2507", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -1768,128 +1654,116 @@ "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-04", - "release_date": "2024-09", - "last_updated": "2024-09", + "open_weights": false, + "knowledge": "2025-04", + "release_date": "2025-07-30", + "last_updated": "2025-07-30", "cost": { - "input": 0.35, - "output": 1.05 - }, - "type": "chat" + "input": 0.29, + "output": 1.143 + } }, { - "id": "qwen3-235b-a22b", - "name": "Qwen3 235B A22B", - "display_name": "Qwen3 235B A22B", + "id": "grok-4-fast-reasoning", + "name": "grok-4-fast-reasoning", + "display_name": "grok-4-fast-reasoning", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 2000000, + "output": 30000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2025-04", + "attachment": true, + "open_weights": false, + "knowledge": "2025-06", + "release_date": "2025-09-23", + "last_updated": "2025-09-23", "cost": { - "input": 0.7, - "output": 2.8, - "reasoning": 8.4 - }, - "type": "chat" + "input": 0.2, + "output": 0.5 + } }, { - "id": "qwen-omni-turbo-realtime", - "name": "Qwen-Omni Turbo Realtime", - "display_name": "Qwen-Omni Turbo Realtime", + "id": "mistral-large-2512", + "name": "mistral-large-2512", + "display_name": "mistral-large-2512", "modalities": { "input": [ "text", - "image", - "audio" + "image" ], "output": [ - "text", - "audio" + "text" ] }, "limit": { - "context": 32768, - "output": 2048 + "context": 128000, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-05-08", - "last_updated": "2025-05-08", + "knowledge": "2024-12", + "release_date": "2025-12-16", + "last_updated": "2025-12-16", "cost": { - "input": 0.27, - "output": 1.07, - "input_audio": 4.44, - "output_audio": 8.89 - }, - "type": "chat" + "input": 1.1, + "output": 3.3 + } }, { - "id": "qwen-mt-turbo", - "name": "Qwen Mt Turbo", - "display_name": "Qwen Mt Turbo", + "id": "gemini-3-flash-preview", + "name": "gemini-3-flash-preview", + "display_name": "gemini-3-flash-preview", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 16384, - "output": 8192 + "context": 1000000, + "output": 65536 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-01", - "last_updated": "2025-01", + "knowledge": "2025-06", + "release_date": "2025-12-18", + "last_updated": "2025-12-18", "cost": { - "input": 0.16, - "output": 0.49 - }, - "type": "chat" + "input": 0.5, + "output": 3 + } }, { - "id": "qwen3-coder-480b-a35b-instruct", - "name": "Qwen3-Coder 480B-A35B Instruct", - "display_name": "Qwen3-Coder 480B-A35B Instruct", + "id": "MiniMax-M2", + "name": "MiniMax-M2", + "display_name": "MiniMax-M2", "modalities": { "input": [ "text" @@ -1899,8 +1773,8 @@ ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 1000000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -1908,20 +1782,51 @@ "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2025-04", + "open_weights": false, + "release_date": "2025-10-26", + "last_updated": "2025-10-26", "cost": { - "input": 1.5, - "output": 7.5 + "input": 0.33, + "output": 1.32 + } + }, + { + "id": "grok-4-1-fast-reasoning", + "name": "grok-4-1-fast-reasoning", + "display_name": "grok-4-1-fast-reasoning", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] }, - "type": "chat" + "limit": { + "context": 2000000, + "output": 30000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-06", + "release_date": "2025-11-20", + "last_updated": "2025-11-20", + "cost": { + "input": 0.2, + "output": 0.5 + } }, { - "id": "qwen-mt-plus", - "name": "Qwen Mt Plus", - "display_name": "Qwen Mt Plus", + "id": "deepseek-v3.2-thinking", + "name": "DeepSeek-V3.2-Thinking", + "display_name": "DeepSeek-V3.2-Thinking", "modalities": { "input": [ "text" @@ -1931,61 +1836,61 @@ ] }, "limit": { - "context": 16384, - "output": 8192 + "context": 128000, + "output": 128000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-01", - "last_updated": "2025-01", + "knowledge": "2024-12", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "cost": { - "input": 2.46, - "output": 7.37 - }, - "type": "chat" + "input": 0.29, + "output": 0.43 + } }, { - "id": "qwen3-max", - "name": "Qwen3 Max", - "display_name": "Qwen3 Max", + "id": "ministral-14b-2512", + "name": "ministral-14b-2512", + "display_name": "ministral-14b-2512", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-09-23", - "last_updated": "2025-09-23", + "knowledge": "2024-12", + "release_date": "2025-12-16", + "last_updated": "2025-12-16", "cost": { - "input": 1.2, - "output": 6 - }, - "type": "chat" + "input": 0.33, + "output": 0.33 + } }, { - "id": "qwen3-coder-plus", - "name": "Qwen3 Coder Plus", - "display_name": "Qwen3 Coder Plus", + "id": "glm-4.5", + "name": "GLM-4.5", + "display_name": "GLM-4.5", "modalities": { "input": [ "text" @@ -1995,8 +1900,8 @@ ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 128000, + "output": 98304 }, "temperature": true, "tool_call": true, @@ -2004,58 +1909,52 @@ "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-23", - "last_updated": "2025-07-23", + "open_weights": false, + "knowledge": "2024-10", + "release_date": "2025-07-29", + "last_updated": "2025-07-29", "cost": { - "input": 1, - "output": 5 - }, - "type": "chat" + "input": 0.286, + "output": 1.142 + } }, { - "id": "qwen3-next-80b-a3b-thinking", - "name": "Qwen3 Next 80B A3B Thinking", - "display_name": "Qwen3 Next 80B A3B Thinking", + "id": "gpt-5-thinking", + "name": "gpt-5-thinking", + "display_name": "gpt-5-thinking", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 400000, + "output": 128000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, - "default": true, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-09", - "last_updated": "2025-09", + "attachment": true, + "open_weights": false, + "knowledge": "2024-10", + "release_date": "2025-08-08", + "last_updated": "2025-08-08", "cost": { - "input": 0.5, - "output": 6 - }, - "type": "chat" + "input": 1.25, + "output": 10 + } }, { - "id": "qwen3-32b", - "name": "Qwen3 32B", - "display_name": "Qwen3 32B", + "id": "kimi-k2-thinking-turbo", + "name": "kimi-k2-thinking-turbo", + "display_name": "kimi-k2-thinking-turbo", "modalities": { "input": [ "text" @@ -2065,36 +1964,29 @@ ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true, - "budget": { - "default": 38912, - "min": 0, - "max": 38912 - } + "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2025-04", + "open_weights": false, + "knowledge": "2025-06", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", "cost": { - "input": 0.7, - "output": 2.8, - "reasoning": 8.4 - }, - "type": "chat" + "input": 1.265, + "output": 9.119 + } }, { - "id": "qwen-vl-plus", - "name": "Qwen-VL Plus", - "display_name": "Qwen-VL Plus", + "id": "gemini-2.5-flash-image", + "name": "gemini-2.5-flash-image", + "display_name": "gemini-2.5-flash-image", "modalities": { "input": [ "text", @@ -2105,29 +1997,28 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 32768, + "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-01-25", - "last_updated": "2025-08-15", + "knowledge": "2025-01", + "release_date": "2025-10-08", + "last_updated": "2025-10-08", "cost": { - "input": 0.21, - "output": 0.63 - }, - "type": "chat" + "input": 0.3, + "output": 30 + } }, { - "id": "qwen3-coder-plus-2025-09-23", - "name": "Qwen3 Coder Plus 2025 09 23", - "display_name": "Qwen3 Coder Plus 2025 09 23", + "id": "deepseek-chat", + "name": "Deepseek-Chat", + "display_name": "Deepseek-Chat", "modalities": { "input": [ "text" @@ -2137,8 +2028,8 @@ ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -2146,15 +2037,23 @@ "supported": false }, "attachment": false, - "type": "chat" + "open_weights": false, + "knowledge": "2024-07", + "release_date": "2024-11-29", + "last_updated": "2024-11-29", + "cost": { + "input": 0.29, + "output": 0.43 + } }, { - "id": "qwen3-coder-plus-2025-07-22", - "name": "Qwen3 Coder Plus 2025 07 22", - "display_name": "Qwen3 Coder Plus 2025 07 22", + "id": "gemini-3-pro-preview", + "name": "gemini-3-pro-preview", + "display_name": "gemini-3-pro-preview", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -2162,20 +2061,27 @@ }, "limit": { "context": 1000000, - "output": 65536 + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2025-06", + "release_date": "2025-11-19", + "last_updated": "2025-11-19", + "cost": { + "input": 2, + "output": 12 + } }, { - "id": "qwen-vl-ocr-latest", - "name": "Qwen Vl Ocr Latest", - "display_name": "Qwen Vl Ocr Latest", + "id": "gemini-2.5-flash", + "name": "gemini-2.5-flash", + "display_name": "gemini-2.5-flash", "modalities": { "input": [ "text", @@ -2186,21 +2092,28 @@ ] }, "limit": { - "context": 34096, - "output": 4096 + "context": 1000000, + "output": 65536 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", + "cost": { + "input": 0.3, + "output": 2.5 + } }, { - "id": "qvq-max-2025-05-15", - "name": "Qvq Max 2025 05 15", - "display_name": "Qvq Max 2025 05 15", + "id": "gpt-4.1-mini", + "name": "gpt-4.1-mini", + "display_name": "gpt-4.1-mini", "modalities": { "input": [ "text", @@ -2211,37 +2124,39 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1000000, + "output": 32768 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": false, - "budget": { - "default": 16384, - "min": 0, - "max": 16384 - } + "supported": false }, - "attachment": false, - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", + "cost": { + "input": 0.4, + "output": 1.6 + } }, { - "id": "qwen-long", - "name": "Qwen Long", - "display_name": "Qwen Long", + "id": "gemini-2.0-flash-lite", + "name": "gemini-2.0-flash-lite", + "display_name": "gemini-2.0-flash-lite", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, + "context": 2000000, "output": 8192 }, "temperature": true, @@ -2249,74 +2164,86 @@ "reasoning": { "supported": false }, - "attachment": false, - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2024-11", + "release_date": "2025-06-16", + "last_updated": "2025-06-16", + "cost": { + "input": 0.075, + "output": 0.3 + } }, { - "id": "qwen-turbo-latest", - "name": "Qwen Turbo Latest", - "display_name": "Qwen Turbo Latest", + "id": "claude-sonnet-4-5-20250929-thinking", + "name": "claude-sonnet-4-5-20250929-thinking", + "display_name": "claude-sonnet-4-5-20250929-thinking", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false, - "budget": { - "default": 38912, - "min": 0, - "max": 38912 - } - }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" + "default": true }, - "attachment": false, - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2025-03", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", + "cost": { + "input": 3, + "output": 15 + } }, { - "id": "qwen-turbo-2024-09-19", - "name": "Qwen Turbo 2024 09 19", - "display_name": "Qwen Turbo 2024 09 19", + "id": "claude-opus-4-5-20251101", + "name": "claude-opus-4-5-20251101", + "display_name": "claude-opus-4-5-20251101", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "type": "chat" - }, - { - "id": "qwen-flash-2025-07-28", - "name": "Qwen Flash 2025 07 28", - "display_name": "Qwen Flash 2025 07 28", - "modalities": { + "attachment": true, + "open_weights": false, + "knowledge": "2025-03", + "release_date": "2025-11-25", + "last_updated": "2025-11-25", + "cost": { + "input": 5, + "output": 25 + } + }, + { + "id": "qwen3-max-2025-09-23", + "name": "qwen3-max-2025-09-23", + "display_name": "qwen3-max-2025-09-23", + "modalities": { "input": [ "text" ], @@ -2325,129 +2252,124 @@ ] }, "limit": { - "context": 1000000, - "output": 32768 + "context": 258048, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } - }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" + "supported": false }, "attachment": false, - "type": "chat" + "open_weights": false, + "knowledge": "2025-04", + "release_date": "2025-09-24", + "last_updated": "2025-09-24", + "cost": { + "input": 0.86, + "output": 3.43 + } }, { - "id": "qwen-plus-latest", - "name": "Qwen Plus Latest", - "display_name": "Qwen Plus Latest", + "id": "claude-sonnet-4-5-20250929", + "name": "claude-sonnet-4-5-20250929", + "display_name": "claude-sonnet-4-5-20250929", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 32768 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } - }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" + "supported": false }, - "attachment": false, - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2025-03", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", + "cost": { + "input": 3, + "output": 15 + } }, { - "id": "qwen-plus-2024-09-19", - "name": "Qwen Plus 2024 09 19", - "display_name": "Qwen Plus 2024 09 19", + "id": "grok-4.1", + "name": "grok-4.1", + "display_name": "grok-4.1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2025-06", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", + "cost": { + "input": 2, + "output": 10 + } }, { - "id": "qwen-plus-2025-07-14", - "name": "Qwen Plus 2025 07 14", - "display_name": "Qwen Plus 2025 07 14", + "id": "chatgpt-4o-latest", + "name": "chatgpt-4o-latest", + "display_name": "chatgpt-4o-latest", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, + "context": 128000, "output": 16384 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false, - "budget": { - "default": 38912, - "min": 0, - "max": 38912 - } - }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" + "supported": false }, - "attachment": false, - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2023-09", + "release_date": "2024-08-08", + "last_updated": "2024-08-08", + "cost": { + "input": 5, + "output": 15 + } }, { - "id": "qwen-plus-2025-09-11", - "name": "Qwen Plus 2025 09 11", - "display_name": "Qwen Plus 2025 09 11", + "id": "kimi-k2-thinking", + "name": "kimi-k2-thinking", + "display_name": "kimi-k2-thinking", "modalities": { "input": [ "text" @@ -2457,117 +2379,124 @@ ] }, "limit": { - "context": 1000000, - "output": 32768 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } - }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" + "default": true }, "attachment": false, - "type": "chat" + "open_weights": false, + "knowledge": "2025-06", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", + "cost": { + "input": 0.575, + "output": 2.3 + } }, { - "id": "qwen-max-latest", - "name": "Qwen Max Latest", - "display_name": "Qwen Max Latest", + "id": "gpt-5.2-chat-latest", + "name": "gpt-5.2-chat-latest", + "display_name": "gpt-5.2-chat-latest", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" - }, - "attachment": false, - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2024-10", + "release_date": "2025-12-12", + "last_updated": "2025-12-12", + "cost": { + "input": 1.75, + "output": 14 + } }, { - "id": "qwen-max-2024-09-19", - "name": "Qwen Max 2024 09 19", - "display_name": "Qwen Max 2024 09 19", + "id": "gpt-5.1", + "name": "gpt-5.1", + "display_name": "gpt-5.1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 8192 + "context": 400000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" - }, - "attachment": false, - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2024-10", + "release_date": "2025-11-14", + "last_updated": "2025-11-14", + "cost": { + "input": 1.25, + "output": 10 + } }, { - "id": "qwen-max-2024-04-28", - "name": "Qwen Max 2024 04 28", - "display_name": "Qwen Max 2024 04 28", + "id": "doubao-seed-1-6-vision-250815", + "name": "doubao-seed-1-6-vision-250815", + "display_name": "doubao-seed-1-6-vision-250815", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8000, - "output": 2000 + "context": 256000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "type": "chat" + "attachment": true, + "open_weights": false, + "release_date": "2025-09-30", + "last_updated": "2025-09-30", + "cost": { + "input": 0.114, + "output": 1.143 + } }, { - "id": "qwen-max-2024-04-03", - "name": "Qwen Max 2024 04 03", - "display_name": "Qwen Max 2024 04 03", + "id": "qwen-flash", + "name": "Qwen-Flash", + "display_name": "Qwen-Flash", "modalities": { "input": [ "text" @@ -2577,8 +2506,8 @@ ] }, "limit": { - "context": 8000, - "output": 2000 + "context": 1000000, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -2586,42 +2515,50 @@ "supported": false }, "attachment": false, - "type": "chat" + "open_weights": false, + "release_date": "2025-07-28", + "last_updated": "2025-07-28", + "cost": { + "input": 0.022, + "output": 0.22 + } }, { - "id": "qwen-max-2025-01-25", - "name": "Qwen Max 2025 01 25", - "display_name": "Qwen Max 2025 01 25", + "id": "gemini-3-pro-image-preview", + "name": "gemini-3-pro-image-preview", + "display_name": "gemini-3-pro-image-preview", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 32768, + "output": 64000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" - }, - "attachment": false, - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2025-06", + "release_date": "2025-11-20", + "last_updated": "2025-11-20", + "cost": { + "input": 2, + "output": 120 + } }, { - "id": "qwen3-max-2025-09-23", - "name": "Qwen3 Max 20250923", - "display_name": "Qwen3 Max 20250923", + "id": "kimi-k2-0905-preview", + "name": "kimi-k2-0905-preview", + "display_name": "kimi-k2-0905-preview", "modalities": { "input": [ "text" @@ -2632,96 +2569,102 @@ }, "limit": { "context": 262144, - "output": 65536 + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" - }, "attachment": false, - "type": "chat" + "open_weights": false, + "knowledge": "2025-06", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", + "cost": { + "input": 0.632, + "output": 2.53 + } }, { - "id": "qwen3-max-preview", - "name": "Qwen3 Max Preview", - "display_name": "Qwen3 Max Preview", + "id": "gpt-4o", + "name": "gpt-4o", + "display_name": "gpt-4o", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" - }, - "attachment": false, - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2023-09", + "release_date": "2024-05-13", + "last_updated": "2024-05-13", + "cost": { + "input": 2.5, + "output": 10 + } }, { - "id": "qwen3-235b-a22b-thinking-2507", - "name": "Qwen3 235B A22B Thinking 2507", - "display_name": "Qwen3 235B A22B Thinking 2507", + "id": "doubao-seed-1-6-thinking-250715", + "name": "doubao-seed-1-6-thinking-250715", + "display_name": "doubao-seed-1-6-thinking-250715", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 256000, + "output": 16000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, - "default": true, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } + "default": true }, - "attachment": false, - "type": "chat" + "attachment": true, + "open_weights": false, + "release_date": "2025-07-15", + "last_updated": "2025-07-15", + "cost": { + "input": 0.121, + "output": 1.21 + } }, { - "id": "qwen3-235b-a22b-instruct-2507", - "name": "Qwen3 235B A22B Instruct 2507", - "display_name": "Qwen3 235B A22B Instruct 2507", + "id": "gpt-4.1", + "name": "gpt-4.1", + "display_name": "gpt-4.1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, + "context": 1000000, "output": 32768 }, "temperature": true, @@ -2729,13 +2672,20 @@ "reasoning": { "supported": false }, - "attachment": false, - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", + "cost": { + "input": 2, + "output": 8 + } }, { - "id": "qwen3-30b-a3b-instruct-2507", - "name": "Qwen3 30B A3B Instruct 2507", - "display_name": "Qwen3 30B A3B Instruct 2507", + "id": "qwen-plus", + "name": "Qwen-Plus", + "display_name": "Qwen-Plus", "modalities": { "input": [ "text" @@ -2745,7 +2695,7 @@ ] }, "limit": { - "context": 131072, + "context": 1000000, "output": 32768 }, "temperature": true, @@ -2754,42 +2704,51 @@ "supported": false }, "attachment": false, - "type": "chat" + "open_weights": false, + "knowledge": "2024-10", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", + "cost": { + "input": 0.12, + "output": 1.2 + } }, { - "id": "qwen3-30b-a3b-thinking-2507", - "name": "Qwen3 30B A3B Thinking 2507", - "display_name": "Qwen3 30B A3B Thinking 2507", + "id": "glm-4.5v", + "name": "GLM-4.5V", + "display_name": "GLM-4.5V", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 64000, + "output": 16384 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": true, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } + "supported": false }, - "attachment": false, - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2024-10", + "release_date": "2025-07-29", + "last_updated": "2025-07-29", + "cost": { + "input": 0.29, + "output": 0.86 + } }, { - "id": "qwen3-30b-a3b", - "name": "Qwen3 30B A3B", - "display_name": "Qwen3 30B A3B", + "id": "glm-4.6", + "name": "glm-4.6", + "display_name": "glm-4.6", "modalities": { "input": [ "text" @@ -2799,148 +2758,186 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 200000, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } + "supported": false }, "attachment": false, - "type": "chat" + "open_weights": false, + "knowledge": "2025-03", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", + "cost": { + "input": 0.286, + "output": 1.142 + } }, { - "id": "qwen3-4b", - "name": "Qwen3 4B", - "display_name": "Qwen3 4B", + "id": "gemini-2.5-flash-preview-09-2025", + "name": "gemini-2.5-flash-preview-09-2025", + "display_name": "gemini-2.5-flash-preview-09-2025", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1000000, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true, - "budget": { - "default": 38912, - "min": 0, - "max": 38912 - } + "supported": false }, - "attachment": false, - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-09-26", + "last_updated": "2025-09-26", + "cost": { + "input": 0.3, + "output": 2.5 + } }, { - "id": "qwen3-1.7b", - "name": "Qwen3 1.7B", - "display_name": "Qwen3 1.7B", + "id": "gpt-5-mini", + "name": "gpt-5-mini", + "display_name": "gpt-5-mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 8192 + "context": 400000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true, - "budget": { - "default": 30720, - "min": 0, - "max": 30720 - } + "supported": false }, - "attachment": false, - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2024-10", + "release_date": "2025-08-08", + "last_updated": "2025-08-08", + "cost": { + "input": 0.25, + "output": 2 + } }, { - "id": "qwen3-0.6b", - "name": "Qwen3 0.6B", - "display_name": "Qwen3 0.6B", + "id": "claude-opus-4-1-20250805-thinking", + "name": "claude-opus-4-1-20250805-thinking", + "display_name": "claude-opus-4-1-20250805-thinking", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 8192 + "context": 200000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true, - "budget": { - "default": 30720, - "min": 0, - "max": 30720 - } + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-03", + "release_date": "2025-05-27", + "last_updated": "2025-05-27", + "cost": { + "input": 15, + "output": 75 + } + }, + { + "id": "qwen3-235b-a22b", + "name": "Qwen3-235B-A22B", + "display_name": "Qwen3-235B-A22B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false }, "attachment": false, - "type": "chat" + "open_weights": false, + "knowledge": "2025-04", + "release_date": "2025-04-29", + "last_updated": "2025-04-29", + "cost": { + "input": 0.29, + "output": 2.86 + } }, { - "id": "qwen3-vl-plus-2025-09-23", - "name": "Qwen3 VL Plus 2025 09 23", - "display_name": "Qwen3 VL Plus 2025 09 23", + "id": "MiniMax-M1", + "name": "MiniMax-M1", + "display_name": "MiniMax-M1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 1000000, + "output": 128000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": false, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } + "supported": false }, "attachment": false, - "type": "chat" + "open_weights": false, + "release_date": "2025-06-16", + "last_updated": "2025-06-16", + "cost": { + "input": 0.132, + "output": 1.254 + } }, { - "id": "qwq-plus-latest", - "name": "QwQ Plus Latest", - "display_name": "QwQ Plus Latest", + "id": "deepseek-reasoner", + "name": "Deepseek-Reasoner", + "display_name": "Deepseek-Reasoner", "modalities": { "input": [ "text" @@ -2950,38 +2947,29 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 128000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, - "default": true, - "budget": { - "default": 32768, - "min": 0, - "max": 32768 - } - }, - "search": { - "supported": false + "default": true }, "attachment": false, - "type": "chat" - } - ] - }, - "xai": { - "id": "xai", - "name": "xai", - "display_name": "xai", - "doc": "https://docs.x.ai/docs/models", - "models": [ + "open_weights": false, + "knowledge": "2024-07", + "release_date": "2025-01-20", + "last_updated": "2025-01-20", + "cost": { + "input": 0.29, + "output": 0.43 + } + }, { - "id": "grok-4-fast-non-reasoning", - "name": "Grok 4 Fast (Non-Reasoning)", - "display_name": "Grok 4 Fast (Non-Reasoning)", + "id": "gemini-2.5-pro", + "name": "gemini-2.5-pro", + "display_name": "gemini-2.5-pro", "modalities": { "input": [ "text", @@ -2992,8 +2980,8 @@ ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 1000000, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -3002,20 +2990,18 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-09-19", - "last_updated": "2025-09-19", + "knowledge": "2025-01", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 - }, - "type": "chat" + "input": 1.25, + "output": 10 + } }, { - "id": "grok-3-fast", - "name": "Grok 3 Fast", - "display_name": "Grok 3 Fast", + "id": "qwen-max-latest", + "name": "Qwen-Max-Latest", + "display_name": "Qwen-Max-Latest", "modalities": { "input": [ "text" @@ -3036,19 +3022,17 @@ "attachment": false, "open_weights": false, "knowledge": "2024-11", - "release_date": "2025-02-17", - "last_updated": "2025-02-17", + "release_date": "2024-04-03", + "last_updated": "2025-01-25", "cost": { - "input": 5, - "output": 25, - "cache_read": 1.25 - }, - "type": "chat" + "input": 0.343, + "output": 1.372 + } }, { - "id": "grok-4", - "name": "Grok 4", - "display_name": "Grok 4", + "id": "qwen3-coder-480b-a35b-instruct", + "name": "qwen3-coder-480b-a35b-instruct", + "display_name": "qwen3-coder-480b-a35b-instruct", "modalities": { "input": [ "text" @@ -3058,32 +3042,28 @@ ] }, "limit": { - "context": 256000, - "output": 64000 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-07-09", - "last_updated": "2025-07-09", + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", "cost": { - "input": 3, - "output": 15, - "reasoning": 15, - "cache_read": 0.75 - }, - "type": "chat" + "input": 0.86, + "output": 3.43 + } }, { - "id": "grok-2-vision", - "name": "Grok 2 Vision", - "display_name": "Grok 2 Vision", + "id": "gpt-5", + "name": "gpt-5", + "display_name": "gpt-5", "modalities": { "input": [ "text", @@ -3094,8 +3074,8 @@ ] }, "limit": { - "context": 8192, - "output": 4096 + "context": 400000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -3104,20 +3084,18 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-08", - "release_date": "2024-08-20", - "last_updated": "2024-08-20", + "knowledge": "2024-10", + "release_date": "2025-08-08", + "last_updated": "2025-08-08", "cost": { - "input": 2, - "output": 10, - "cache_read": 2 - }, - "type": "chat" + "input": 1.25, + "output": 10 + } }, { - "id": "grok-code-fast-1", - "name": "Grok Code Fast 1", - "display_name": "Grok Code Fast 1", + "id": "qwen3-30b-a3b", + "name": "Qwen3-30B-A3B", + "display_name": "Qwen3-30B-A3B", "modalities": { "input": [ "text" @@ -3127,31 +3105,28 @@ ] }, "limit": { - "context": 256000, - "output": 10000 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2023-10", - "release_date": "2025-08-28", - "last_updated": "2025-08-28", + "knowledge": "2025-04", + "release_date": "2025-04-29", + "last_updated": "2025-04-29", "cost": { - "input": 0.2, - "output": 1.5, - "cache_read": 0.02 - }, - "type": "chat" + "input": 0.11, + "output": 1.08 + } }, { - "id": "grok-2", - "name": "Grok 2", - "display_name": "Grok 2", + "id": "deepseek-v3.2", + "name": "deepseek-v3.2", + "display_name": "deepseek-v3.2", "modalities": { "input": [ "text" @@ -3161,7 +3136,7 @@ ] }, "limit": { - "context": 131072, + "context": 128000, "output": 8192 }, "temperature": true, @@ -3171,20 +3146,18 @@ }, "attachment": false, "open_weights": false, - "knowledge": "2024-08", - "release_date": "2024-08-20", - "last_updated": "2024-08-20", + "knowledge": "2024-12", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "cost": { - "input": 2, - "output": 10, - "cache_read": 2 - }, - "type": "chat" + "input": 0.29, + "output": 0.43 + } }, { - "id": "grok-3-mini-fast-latest", - "name": "Grok 3 Mini Fast Latest", - "display_name": "Grok 3 Mini Fast Latest", + "id": "MiniMax-M2.1", + "name": "MiniMax-M2.1", + "display_name": "MiniMax-M2.1", "modalities": { "input": [ "text" @@ -3194,32 +3167,27 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1000000, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2024-11", - "release_date": "2025-02-17", - "last_updated": "2025-02-17", + "release_date": "2025-12-19", + "last_updated": "2025-12-19", "cost": { - "input": 0.6, - "output": 4, - "reasoning": 4, - "cache_read": 0.15 - }, - "type": "chat" + "input": 0.3, + "output": 1.2 + } }, { - "id": "grok-2-vision-1212", - "name": "Grok 2 Vision 1212", - "display_name": "Grok 2 Vision 1212", + "id": "gemini-2.5-flash-lite-preview-09-2025", + "name": "gemini-2.5-flash-lite-preview-09-2025", + "display_name": "gemini-2.5-flash-lite-preview-09-2025", "modalities": { "input": [ "text", @@ -3230,66 +3198,60 @@ ] }, "limit": { - "context": 32000, - "output": 32000 + "context": 1000000, + "output": 65536 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "search": { - "supported": false - }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-08", - "release_date": "2024-08-20", - "last_updated": "2024-12-12", + "knowledge": "2025-01", + "release_date": "2025-09-26", + "last_updated": "2025-09-26", "cost": { - "input": 2, - "output": 10, - "cache_read": 2 - }, - "type": "chat" + "input": 0.1, + "output": 0.4 + } }, { - "id": "grok-3", - "name": "Grok 3", - "display_name": "Grok 3", + "id": "grok-4-1-fast-non-reasoning", + "name": "grok-4-1-fast-non-reasoning", + "display_name": "grok-4-1-fast-non-reasoning", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 2000000, + "output": 30000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-11", - "release_date": "2025-02-17", - "last_updated": "2025-02-17", + "knowledge": "2025-06", + "release_date": "2025-11-20", + "last_updated": "2025-11-20", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.75 - }, - "type": "chat" + "input": 0.2, + "output": 0.5 + } }, { - "id": "grok-4-fast", - "name": "Grok 4 Fast", - "display_name": "Grok 4 Fast", + "id": "doubao-seed-1-8-251215", + "name": "doubao-seed-1-8-251215", + "display_name": "doubao-seed-1-8-251215", "modalities": { "input": [ "text", @@ -3300,64 +3262,59 @@ ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 224000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-09-19", - "last_updated": "2025-09-19", + "release_date": "2025-12-18", + "last_updated": "2025-12-18", "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 - }, - "type": "chat" + "input": 0.114, + "output": 0.286 + } }, { - "id": "grok-2-latest", - "name": "Grok 2 Latest", - "display_name": "Grok 2 Latest", + "id": "gpt-5-pro", + "name": "gpt-5-pro", + "display_name": "gpt-5-pro", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 400000, + "output": 272000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-08", - "release_date": "2024-08-20", - "last_updated": "2024-12-12", + "knowledge": "2024-10", + "release_date": "2025-10-08", + "last_updated": "2025-10-08", "cost": { - "input": 2, - "output": 10, - "cache_read": 2 - }, - "type": "chat" + "input": 15, + "output": 120 + } }, { - "id": "grok-4-1-fast", - "name": "Grok 4.1 Fast", - "display_name": "Grok 4.1 Fast", + "id": "gemini-2.5-flash-nothink", + "name": "gemini-2.5-flash-nothink", + "display_name": "gemini-2.5-flash-nothink", "modalities": { "input": [ "text", @@ -3368,133 +3325,124 @@ ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 1000000, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-11-19", - "last_updated": "2025-11-19", + "knowledge": "2025-01", + "release_date": "2025-06-24", + "last_updated": "2025-06-24", "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 - }, - "type": "chat" + "input": 0.3, + "output": 2.5 + } }, { - "id": "grok-2-1212", - "name": "Grok 2 1212", - "display_name": "Grok 2 1212", + "id": "claude-opus-4-1-20250805", + "name": "claude-opus-4-1-20250805", + "display_name": "claude-opus-4-1-20250805", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 120000, - "output": 100000 + "context": 200000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "search": { - "supported": false - }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-08", - "release_date": "2024-12-12", - "last_updated": "2024-12-12", + "knowledge": "2025-03", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 2, - "output": 10, - "cache_read": 2 - }, - "type": "chat" + "input": 15, + "output": 75 + } }, { - "id": "grok-3-fast-latest", - "name": "Grok 3 Fast Latest", - "display_name": "Grok 3 Fast Latest", + "id": "gpt-5.2", + "name": "gpt-5.2", + "display_name": "gpt-5.2", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 400000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-11", - "release_date": "2025-02-17", - "last_updated": "2025-02-17", + "knowledge": "2024-10", + "release_date": "2025-12-12", + "last_updated": "2025-12-12", "cost": { - "input": 5, - "output": 25, - "cache_read": 1.25 - }, - "type": "chat" + "input": 1.75, + "output": 14 + } }, { - "id": "grok-3-latest", - "name": "Grok 3 Latest", - "display_name": "Grok 3 Latest", + "id": "gpt-5.1-chat-latest", + "name": "gpt-5.1-chat-latest", + "display_name": "gpt-5.1-chat-latest", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-11", - "release_date": "2025-02-17", - "last_updated": "2025-02-17", + "knowledge": "2024-10", + "release_date": "2025-11-14", + "last_updated": "2025-11-14", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.75 - }, - "type": "chat" + "input": 1.25, + "output": 10 + } }, { - "id": "grok-2-vision-latest", - "name": "Grok 2 Vision Latest", - "display_name": "Grok 2 Vision Latest", + "id": "glm-4.6v", + "name": "GLM-4.6V", + "display_name": "GLM-4.6V", "modalities": { "input": [ "text", @@ -3505,8 +3453,8 @@ ] }, "limit": { - "context": 8192, - "output": 4096 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -3515,20 +3463,18 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-08", - "release_date": "2024-08-20", - "last_updated": "2024-12-12", + "knowledge": "2025-03", + "release_date": "2025-12-08", + "last_updated": "2025-12-08", "cost": { - "input": 2, - "output": 10, - "cache_read": 2 - }, - "type": "chat" + "input": 0.145, + "output": 0.43 + } }, { - "id": "grok-vision-beta", - "name": "Grok Vision Beta", - "display_name": "Grok Vision Beta", + "id": "claude-opus-4-5-20251101-thinking", + "name": "claude-opus-4-5-20251101-thinking", + "display_name": "claude-opus-4-5-20251101-thinking", "modalities": { "input": [ "text", @@ -3539,65 +3485,70 @@ ] }, "limit": { - "context": 8192, - "output": 4096 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2024-08", - "release_date": "2024-11-01", - "last_updated": "2024-11-01", + "knowledge": "2025-03", + "release_date": "2025-11-25", + "last_updated": "2025-11-25", "cost": { "input": 5, - "output": 15, - "cache_read": 5 - }, - "type": "chat" + "output": 25 + } }, { - "id": "grok-3-mini", - "name": "Grok 3 Mini", - "display_name": "Grok 3 Mini", + "id": "claude-haiku-4-5-20251001", + "name": "claude-haiku-4-5-20251001", + "display_name": "claude-haiku-4-5-20251001", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-11", - "release_date": "2025-02-17", - "last_updated": "2025-02-17", + "knowledge": "2025-03", + "release_date": "2025-10-16", + "last_updated": "2025-10-16", "cost": { - "input": 0.3, - "output": 0.5, - "reasoning": 0.5, - "cache_read": 0.075 - }, - "type": "chat" - }, + "input": 1, + "output": 5 + } + } + ] + }, + "zai-coding-plan": { + "id": "zai-coding-plan", + "name": "Z.AI Coding Plan", + "display_name": "Z.AI Coding Plan", + "api": "https://api.z.ai/api/coding/paas/v4", + "doc": "https://docs.z.ai/devpack/overview", + "models": [ { - "id": "grok-beta", - "name": "Grok Beta", - "display_name": "Grok Beta", + "id": "glm-4.7", + "name": "GLM-4.7", + "display_name": "GLM-4.7", "modalities": { "input": [ "text" @@ -3607,30 +3558,31 @@ ] }, "limit": { - "context": 131072, - "output": 4096 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2024-08", - "release_date": "2024-11-01", - "last_updated": "2024-11-01", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "cost": { - "input": 5, - "output": 15, - "cache_read": 5 - }, - "type": "chat" + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 + } }, { - "id": "grok-3-mini-latest", - "name": "Grok 3 Mini Latest", - "display_name": "Grok 3 Mini Latest", + "id": "glm-4.5-flash", + "name": "GLM-4.5-Flash", + "display_name": "GLM-4.5-Flash", "modalities": { "input": [ "text" @@ -3641,7 +3593,7 @@ }, "limit": { "context": 131072, - "output": 8192 + "output": 98304 }, "temperature": true, "tool_call": true, @@ -3650,56 +3602,55 @@ "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2024-11", - "release_date": "2025-02-17", - "last_updated": "2025-02-17", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 0.3, - "output": 0.5, - "reasoning": 0.5, - "cache_read": 0.075 - }, - "type": "chat" + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 + } }, { - "id": "grok-4-1-fast-non-reasoning", - "name": "Grok 4.1 Fast (Non-Reasoning)", - "display_name": "Grok 4.1 Fast (Non-Reasoning)", + "id": "glm-4.5", + "name": "GLM-4.5", + "display_name": "GLM-4.5", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 131072, + "output": 98304 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-11-19", - "last_updated": "2025-11-19", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 - }, - "type": "chat" + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 + } }, { - "id": "grok-3-mini-fast", - "name": "Grok 3 Mini Fast", - "display_name": "Grok 3 Mini Fast", + "id": "glm-4.7-flash", + "name": "GLM-4.7-Flash", + "display_name": "GLM-4.7-Flash", "modalities": { "input": [ "text" @@ -3709,8 +3660,8 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 200000, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -3719,22 +3670,21 @@ "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2024-11", - "release_date": "2025-02-17", - "last_updated": "2025-02-17", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2026-01-19", + "last_updated": "2026-01-19", "cost": { - "input": 0.6, - "output": 4, - "reasoning": 4, - "cache_read": 0.15 - }, - "type": "chat" + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 + } }, { - "id": "grok-3-mini-fast-beta", - "name": "Grok 3 Mini Fast Beta", - "display_name": "Grok 3 Mini Fast Beta", + "id": "glm-4.5-air", + "name": "GLM-4.5-Air", + "display_name": "GLM-4.5-Air", "modalities": { "input": [ "text" @@ -3744,55 +3694,65 @@ ] }, "limit": { - "context": 120000, - "output": 100000 + "context": 131072, + "output": 98304 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true, - "effort": "low" - }, - "search": { - "supported": false + "default": true }, "attachment": false, - "type": "chat" + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", + "cost": { + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 + } }, { - "id": "grok-3-mini-beta", - "name": "Grok 3 Mini Beta", - "display_name": "Grok 3 Mini Beta", + "id": "glm-4.5v", + "name": "GLM-4.5V", + "display_name": "GLM-4.5V", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 120000, - "output": 100000 + "context": 64000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true, - "effort": "low" - }, - "search": { - "supported": false + "default": true }, - "attachment": false, - "type": "chat" + "attachment": true, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-08-11", + "last_updated": "2025-08-11", + "cost": { + "input": 0, + "output": 0 + } }, { - "id": "grok-3-fast-beta", - "name": "Grok 3 Fast Beta", - "display_name": "Grok 3 Fast Beta", + "id": "glm-4.6", + "name": "GLM-4.6", + "display_name": "GLM-4.6", "modalities": { "input": [ "text" @@ -3802,52 +3762,74 @@ ] }, "limit": { - "context": 120000, - "output": 100000 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false - }, - "search": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "type": "chat" + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", + "cost": { + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 + } }, { - "id": "grok-2-image-1212", - "name": "Grok 2 Image 1212", - "display_name": "Grok 2 Image 1212", + "id": "glm-4.6v", + "name": "GLM-4.6V", + "display_name": "GLM-4.6V", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 130000, - "output": 100000 + "context": 128000, + "output": 32768 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false - }, - "search": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "type": "chat" - }, + "attachment": true, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-12-08", + "last_updated": "2025-12-08", + "cost": { + "input": 0, + "output": 0 + } + } + ] + }, + "xiaomi": { + "id": "xiaomi", + "name": "Xiaomi", + "display_name": "Xiaomi", + "api": "https://api.xiaomimimo.com/v1", + "doc": "https://platform.xiaomimimo.com/#/docs", + "models": [ { - "id": "grok-3-beta", - "name": "Grok 3 Beta", - "display_name": "Grok 3 Beta", + "id": "mimo-v2-flash", + "name": "MiMo-V2-Flash", + "display_name": "MiMo-V2-Flash", "modalities": { "input": [ "text" @@ -3857,109 +3839,121 @@ ] }, "limit": { - "context": 120000, - "output": 100000 + "context": 256000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false - }, - "search": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "type": "chat" + "open_weights": true, + "knowledge": "2024-12-01", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", + "cost": { + "input": 0.07, + "output": 0.21 + } } ] }, - "vultr": { - "id": "vultr", - "name": "Vultr", - "display_name": "Vultr", - "api": "https://api.vultrinference.com/v1", - "doc": "https://api.vultrinference.com/", + "alibaba": { + "id": "alibaba", + "name": "alibaba", + "display_name": "alibaba", + "api": "https://dashscope-intl.aliyuncs.com/compatible-mode/v1", + "doc": "https://www.alibabacloud.com/help/en/model-studio/models", "models": [ { - "id": "deepseek-r1-distill-qwen-32b", - "name": "DeepSeek R1 Distill Qwen 32B", - "display_name": "DeepSeek R1 Distill Qwen 32B", + "id": "qwen3-livetranslate-flash-realtime", + "name": "Qwen3-LiveTranslate Flash Realtime", + "display_name": "Qwen3-LiveTranslate Flash Realtime", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video" ], "output": [ - "text" + "text", + "audio" ] }, "limit": { - "context": 121808, - "output": 8192 + "context": 53248, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-01-20", - "last_updated": "2025-01-20", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-09-22", + "last_updated": "2025-09-22", "cost": { - "input": 0.2, - "output": 0.2 - }, - "type": "chat" + "input": 10, + "output": 10, + "input_audio": 10, + "output_audio": 38 + } }, { - "id": "qwen2.5-coder-32b-instruct", - "name": "Qwen2.5 Coder 32B Instruct", - "display_name": "Qwen2.5 Coder 32B Instruct", + "id": "qwen3-asr-flash", + "name": "Qwen3-ASR Flash", + "display_name": "Qwen3-ASR Flash", "modalities": { "input": [ - "text" + "audio" ], "output": [ "text" ] }, "limit": { - "context": 12952, - "output": 2048 + "context": 53248, + "output": 4096 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2024-11-06", - "last_updated": "2024-11-06", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-09-08", + "last_updated": "2025-09-08", "cost": { - "input": 0.2, - "output": 0.2 - }, - "type": "chat" + "input": 0.035, + "output": 0.035 + } }, { - "id": "kimi-k2-instruct", - "name": "Kimi K2 Instruct", - "display_name": "Kimi K2 Instruct", + "id": "qwen-omni-turbo", + "name": "Qwen-Omni Turbo", + "display_name": "Qwen-Omni Turbo", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video" ], "output": [ - "text" + "text", + "audio" ] }, "limit": { - "context": 58904, - "output": 4096 + "context": 32768, + "output": 2048 }, "temperature": true, "tool_call": true, @@ -3967,53 +3961,53 @@ "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2024-07-18", - "last_updated": "2024-07-18", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-01-19", + "last_updated": "2025-03-26", "cost": { - "input": 0.2, - "output": 0.2 - }, - "type": "chat" + "input": 0.07, + "output": 0.27, + "input_audio": 4.44, + "output_audio": 8.89 + } }, { - "id": "deepseek-r1-distill-llama-70b", - "name": "DeepSeek R1 Distill Llama 70B", - "display_name": "DeepSeek R1 Distill Llama 70B", + "id": "qwen-vl-max", + "name": "Qwen-VL Max", + "display_name": "Qwen-VL Max", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 121808, + "context": 131072, "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-01-20", - "last_updated": "2025-01-20", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2024-04-08", + "last_updated": "2025-08-13", "cost": { - "input": 0.2, - "output": 0.2 - }, - "type": "chat" + "input": 0.8, + "output": 3.2 + } }, { - "id": "gpt-oss-120b", - "name": "GPT OSS 120B", - "display_name": "GPT OSS 120B", + "id": "qwen3-next-80b-a3b-instruct", + "name": "Qwen3 Next 80B A3B Instruct", + "display_name": "Qwen3 Next 80B A3B Instruct", "modalities": { "input": [ "text" @@ -4023,8 +4017,8 @@ ] }, "limit": { - "context": 121808, - "output": 8192 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -4033,28 +4027,18 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-06-23", - "last_updated": "2025-06-23", + "knowledge": "2025-04", + "release_date": "2025-09", + "last_updated": "2025-09", "cost": { - "input": 0.2, - "output": 0.2 - }, - "type": "chat" - } - ] - }, - "nvidia": { - "id": "nvidia", - "name": "Nvidia", - "display_name": "Nvidia", - "api": "https://integrate.api.nvidia.com/v1", - "doc": "https://docs.api.nvidia.com/nim/", - "models": [ + "input": 0.5, + "output": 2 + } + }, { - "id": "moonshotai/kimi-k2-instruct-0905", - "name": "Kimi K2 0905", - "display_name": "Kimi K2 0905", + "id": "qwen-turbo", + "name": "Qwen Turbo", + "display_name": "Qwen Turbo", "modalities": { "input": [ "text" @@ -4064,40 +4048,53 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 131072, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false, + "budget": { + "default": 38912, + "min": 0, + "max": 38912 + } + }, + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-09-05", - "last_updated": "2025-09-05", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2024-11-01", + "last_updated": "2025-04-28", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.05, + "output": 0.2, + "reasoning": 0.5 + } }, { - "id": "moonshotai/kimi-k2-thinking", - "name": "Kimi K2 Thinking", - "display_name": "Kimi K2 Thinking", + "id": "qwen3-vl-235b-a22b", + "name": "Qwen3-VL 235B-A22B", + "display_name": "Qwen3-VL 235B-A22B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -4107,21 +4104,19 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-07", - "release_date": "2025-11", - "last_updated": "2025-12", + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 - }, - "type": "chat" + "input": 0.7, + "output": 2.8, + "reasoning": 8.4 + } }, { - "id": "moonshotai/kimi-k2-instruct", - "name": "Kimi K2 Instruct", - "display_name": "Kimi K2 Instruct", + "id": "qwen3-coder-flash", + "name": "Qwen3 Coder Flash", + "display_name": "Qwen3 Coder Flash", "modalities": { "input": [ "text" @@ -4131,33 +4126,32 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 1000000, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2024-01", - "release_date": "2025-01-01", - "last_updated": "2025-09-05", + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.3, + "output": 1.5 + } }, { - "id": "nvidia/nvidia-nemotron-nano-9b-v2", - "name": "nvidia-nemotron-nano-9b-v2", - "display_name": "nvidia-nemotron-nano-9b-v2", + "id": "qwen3-vl-30b-a3b", + "name": "Qwen3-VL 30B-A3B", + "display_name": "Qwen3-VL 30B-A3B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -4165,7 +4159,7 @@ }, "limit": { "context": 131072, - "output": 131072 + "output": 32768 }, "temperature": true, "tool_call": true, @@ -4175,24 +4169,22 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-09", - "release_date": "2025-08-18", - "last_updated": "2025-08-18", + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.2, + "output": 0.8, + "reasoning": 2.4 + } }, { - "id": "nvidia/cosmos-nemotron-34b", - "name": "Cosmos Nemotron 34B", - "display_name": "Cosmos Nemotron 34B", + "id": "qwen3-14b", + "name": "Qwen3 14B", + "display_name": "Qwen3 14B", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" @@ -4203,58 +4195,64 @@ "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": true, + "budget": { + "default": 38912, + "min": 0, + "max": 38912 + } }, "attachment": false, - "open_weights": false, - "knowledge": "2024-01", - "release_date": "2024-01-01", - "last_updated": "2025-09-05", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.35, + "output": 1.4, + "reasoning": 4.2 + } }, { - "id": "nvidia/llama-embed-nemotron-8b", - "name": "Llama Embed Nemotron 8B", - "display_name": "Llama Embed Nemotron 8B", + "id": "qvq-max", + "name": "QVQ Max", + "display_name": "QVQ Max", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 2048 + "context": 131072, + "output": 8192 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "knowledge": "2025-03", - "release_date": "2025-03-18", - "last_updated": "2025-03-18", + "knowledge": "2024-04", + "release_date": "2025-03-25", + "last_updated": "2025-03-25", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 1.2, + "output": 4.8 + } }, { - "id": "nvidia/nemotron-3-nano-30b-a3b", - "name": "nemotron-3-nano-30b-a3b", - "display_name": "nemotron-3-nano-30b-a3b", + "id": "qwen-plus-character-ja", + "name": "Qwen Plus Character (Japanese)", + "display_name": "Qwen Plus Character (Japanese)", "modalities": { "input": [ "text" @@ -4264,94 +4262,102 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 8192, + "output": 512 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-09", - "release_date": "2024-12", - "last_updated": "2024-12", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2024-01", + "last_updated": "2024-01", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.5, + "output": 1.4 + } }, { - "id": "nvidia/parakeet-tdt-0.6b-v2", - "name": "Parakeet TDT 0.6B v2", - "display_name": "Parakeet TDT 0.6B v2", + "id": "qwen2-5-14b-instruct", + "name": "Qwen2.5 14B Instruct", + "display_name": "Qwen2.5 14B Instruct", "modalities": { "input": [ - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 4096 + "context": 131072, + "output": 8192 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-01", - "release_date": "2024-01-01", - "last_updated": "2025-09-05", + "open_weights": true, + "knowledge": "2024-04", + "release_date": "2024-09", + "last_updated": "2024-09", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.35, + "output": 1.4 + } }, { - "id": "nvidia/nemoretriever-ocr-v1", - "name": "NeMo Retriever OCR v1", - "display_name": "NeMo Retriever OCR v1", + "id": "qwq-plus", + "name": "QwQ Plus", + "display_name": "QwQ Plus", "modalities": { "input": [ - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 4096 + "context": 131072, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true, + "budget": { + "default": 32768, + "min": 0, + "max": 32768 + } + }, + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, "attachment": false, "open_weights": false, - "knowledge": "2024-01", - "release_date": "2024-01-01", - "last_updated": "2025-09-05", + "knowledge": "2024-04", + "release_date": "2025-03-05", + "last_updated": "2025-03-05", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.8, + "output": 2.4 + } }, { - "id": "nvidia/llama-3.3-nemotron-super-49b-v1", - "name": "Llama 3.3 Nemotron Super 49b V1", - "display_name": "Llama 3.3 Nemotron Super 49b V1", + "id": "qwen3-coder-30b-a3b-instruct", + "name": "Qwen3-Coder 30B-A3B Instruct", + "display_name": "Qwen3-Coder 30B-A3B Instruct", "modalities": { "input": [ "text" @@ -4361,59 +4367,60 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 262144, + "output": 65536 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-03-16", - "last_updated": "2025-03-16", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.45, + "output": 2.25 + } }, { - "id": "nvidia/llama-3.1-nemotron-51b-instruct", - "name": "Llama 3.1 Nemotron 51b Instruct", - "display_name": "Llama 3.1 Nemotron 51b Instruct", + "id": "qwen-vl-ocr", + "name": "Qwen Vl Ocr", + "display_name": "Qwen Vl Ocr", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 34096, "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2024-09-22", - "last_updated": "2024-09-22", + "knowledge": "2024-04", + "release_date": "2024-10-28", + "last_updated": "2025-04-13", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.72, + "output": 0.72 + } }, { - "id": "nvidia/llama3-chatqa-1.5-70b", - "name": "Llama3 Chatqa 1.5 70b", - "display_name": "Llama3 Chatqa 1.5 70b", + "id": "qwen2-5-72b-instruct", + "name": "Qwen2.5 72B Instruct", + "display_name": "Qwen2.5 72B Instruct", "modalities": { "input": [ "text" @@ -4423,8 +4430,8 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -4432,30 +4439,34 @@ "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2024-04-28", - "last_updated": "2024-04-28", + "open_weights": true, + "knowledge": "2024-04", + "release_date": "2024-09", + "last_updated": "2024-09", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 1.4, + "output": 5.6 + } }, { - "id": "nvidia/llama-3.1-nemotron-ultra-253b-v1", - "name": "Llama-3.1-Nemotron-Ultra-253B-v1", - "display_name": "Llama-3.1-Nemotron-Ultra-253B-v1", + "id": "qwen3-omni-flash", + "name": "Qwen3-Omni Flash", + "display_name": "Qwen3-Omni Flash", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video" ], "output": [ - "text" + "text", + "audio" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 65536, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -4465,19 +4476,20 @@ }, "attachment": false, "open_weights": false, - "knowledge": "2024-07", - "release_date": "2024-07-01", - "last_updated": "2025-09-05", + "knowledge": "2024-04", + "release_date": "2025-09-15", + "last_updated": "2025-09-15", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.43, + "output": 1.66, + "input_audio": 3.81, + "output_audio": 15.11 + } }, { - "id": "nvidia/llama-3.1-nemotron-70b-instruct", - "name": "Llama 3.1 Nemotron 70b Instruct", - "display_name": "Llama 3.1 Nemotron 70b Instruct", + "id": "qwen-flash", + "name": "Qwen Flash", + "display_name": "Qwen Flash", "modalities": { "input": [ "text" @@ -4487,28 +4499,40 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 1000000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false, + "budget": { + "default": 81920, + "min": 0, + "max": 81920 + } + }, + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, "attachment": false, "open_weights": false, - "release_date": "2024-10-12", - "last_updated": "2024-10-12", + "knowledge": "2024-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.05, + "output": 0.4 + } }, { - "id": "nvidia/nemotron-4-340b-instruct", - "name": "Nemotron 4 340b Instruct", - "display_name": "Nemotron 4 340b Instruct", + "id": "qwen3-8b", + "name": "Qwen3 8B", + "display_name": "Qwen3 8B", "modalities": { "input": [ "text" @@ -4518,92 +4542,104 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true, + "budget": { + "default": 38912, + "min": 0, + "max": 38912 + } }, "attachment": false, - "open_weights": false, - "release_date": "2024-06-13", - "last_updated": "2024-06-13", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.18, + "output": 0.7, + "reasoning": 2.1 + } }, { - "id": "nvidia/llama-3.3-nemotron-super-49b-v1.5", - "name": "Llama 3.3 Nemotron Super 49b V1.5", - "display_name": "Llama 3.3 Nemotron Super 49b V1.5", + "id": "qwen3-omni-flash-realtime", + "name": "Qwen3-Omni Flash Realtime", + "display_name": "Qwen3-Omni Flash Realtime", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video" ], "output": [ - "text" + "text", + "audio" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 65536, + "output": 16384 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-03-16", - "last_updated": "2025-03-16", + "knowledge": "2024-04", + "release_date": "2025-09-15", + "last_updated": "2025-09-15", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.52, + "output": 1.99, + "input_audio": 4.57, + "output_audio": 18.13 + } }, { - "id": "minimaxai/minimax-m2", - "name": "MiniMax-M2", - "display_name": "MiniMax-M2", + "id": "qwen2-5-vl-72b-instruct", + "name": "Qwen2.5-VL 72B Instruct", + "display_name": "Qwen2.5-VL 72B Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-10-27", - "last_updated": "2025-10-31", + "knowledge": "2024-04", + "release_date": "2024-09", + "last_updated": "2024-09", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 2.8, + "output": 8.4 + } }, { - "id": "google/gemma-3n-e2b-it", - "name": "Gemma 3n E2b It", - "display_name": "Gemma 3n E2b It", + "id": "qwen3-vl-plus", + "name": "Qwen3 VL Plus", + "display_name": "Qwen3 VL Plus", "modalities": { "input": [ "text", @@ -4614,29 +4650,35 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 262144, + "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": false, + "budget": { + "default": 81920, + "min": 0, + "max": 81920 + } }, - "attachment": true, - "open_weights": true, - "knowledge": "2024-06", - "release_date": "2025-06-12", - "last_updated": "2025-06-12", + "attachment": false, + "open_weights": false, + "knowledge": "2025-04", + "release_date": "2025-09-23", + "last_updated": "2025-09-23", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.2, + "output": 1.6, + "reasoning": 4.8 + } }, { - "id": "google/codegemma-1.1-7b", - "name": "Codegemma 1.1 7b", - "display_name": "Codegemma 1.1 7b", + "id": "qwen-plus", + "name": "Qwen Plus", + "display_name": "Qwen Plus", "modalities": { "input": [ "text" @@ -4646,72 +4688,87 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 1000000, + "output": 32768 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false, + "budget": { + "default": 81920, + "min": 0, + "max": 81920 + } + }, + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, "attachment": false, - "open_weights": true, - "release_date": "2024-04-30", - "last_updated": "2024-04-30", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2024-01-25", + "last_updated": "2025-09-11", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.4, + "output": 1.2, + "reasoning": 4 + } }, { - "id": "google/gemma-3n-e4b-it", - "name": "Gemma 3n E4b It", - "display_name": "Gemma 3n E4b It", + "id": "qwen2-5-32b-instruct", + "name": "Qwen2.5 32B Instruct", + "display_name": "Qwen2.5 32B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2024-06", - "release_date": "2025-06-03", - "last_updated": "2025-06-03", + "knowledge": "2024-04", + "release_date": "2024-09", + "last_updated": "2024-09", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.7, + "output": 2.8 + } }, { - "id": "google/gemma-2-2b-it", - "name": "Gemma 2 2b It", - "display_name": "Gemma 2 2b It", + "id": "qwen2-5-omni-7b", + "name": "Qwen2.5-Omni 7B", + "display_name": "Qwen2.5-Omni 7B", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video" ], "output": [ - "text" + "text", + "audio" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 32768, + "output": 2048 }, "temperature": true, "tool_call": true, @@ -4720,18 +4777,19 @@ }, "attachment": false, "open_weights": true, - "release_date": "2024-07-16", - "last_updated": "2024-07-16", + "knowledge": "2024-04", + "release_date": "2024-12", + "last_updated": "2024-12", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.1, + "output": 0.4, + "input_audio": 6.76 + } }, { - "id": "google/gemma-3-12b-it", - "name": "Gemma 3 12b It", - "display_name": "Gemma 3 12b It", + "id": "qwen-max", + "name": "Qwen Max", + "display_name": "Qwen Max", "modalities": { "input": [ "text" @@ -4741,28 +4799,34 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 32768, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" + }, "attachment": false, - "open_weights": true, - "release_date": "2025-03-01", - "last_updated": "2025-03-01", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2024-04-03", + "last_updated": "2025-01-25", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 1.6, + "output": 6.4 + } }, { - "id": "google/codegemma-7b", - "name": "Codegemma 7b", - "display_name": "Codegemma 7b", + "id": "qwen2-5-7b-instruct", + "name": "Qwen2.5 7B Instruct", + "display_name": "Qwen2.5 7B Instruct", "modalities": { "input": [ "text" @@ -4772,28 +4836,28 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 131072, + "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2024-03-21", - "last_updated": "2024-03-21", + "knowledge": "2024-04", + "release_date": "2024-09", + "last_updated": "2024-09", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.175, + "output": 0.7 + } }, { - "id": "google/gemma-3-1b-it", - "name": "Gemma 3 1b It", - "display_name": "Gemma 3 1b It", + "id": "qwen2-5-vl-7b-instruct", + "name": "Qwen2.5-VL 7B Instruct", + "display_name": "Qwen2.5-VL 7B Instruct", "modalities": { "input": [ "text", @@ -4804,28 +4868,28 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2025-03-10", - "last_updated": "2025-03-10", + "knowledge": "2024-04", + "release_date": "2024-09", + "last_updated": "2024-09", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.35, + "output": 1.05 + } }, { - "id": "google/gemma-2-27b-it", - "name": "Gemma 2 27b It", - "display_name": "Gemma 2 27b It", + "id": "qwen3-235b-a22b", + "name": "Qwen3 235B A22B", + "display_name": "Qwen3 235B A22B", "modalities": { "input": [ "text" @@ -4835,193 +4899,195 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false, + "budget": { + "default": 81920, + "min": 0, + "max": 81920 + } }, "attachment": false, "open_weights": true, - "release_date": "2024-06-24", - "last_updated": "2024-06-24", + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.7, + "output": 2.8, + "reasoning": 8.4 + } }, { - "id": "google/gemma-3-27b-it", - "name": "Gemma-3-27B-IT", - "display_name": "Gemma-3-27B-IT", + "id": "qwen-omni-turbo-realtime", + "name": "Qwen-Omni Turbo Realtime", + "display_name": "Qwen-Omni Turbo Realtime", "modalities": { "input": [ "text", - "image" + "image", + "audio" ], "output": [ - "text" + "text", + "audio" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 32768, + "output": 2048 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-12", - "release_date": "2024-12-01", - "last_updated": "2025-09-05", + "knowledge": "2024-04", + "release_date": "2025-05-08", + "last_updated": "2025-05-08", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.27, + "output": 1.07, + "input_audio": 4.44, + "output_audio": 8.89 + } }, { - "id": "microsoft/phi-3-medium-128k-instruct", - "name": "Phi 3 Medium 128k Instruct", - "display_name": "Phi 3 Medium 128k Instruct", + "id": "qwen-mt-turbo", + "name": "Qwen Mt Turbo", + "display_name": "Qwen Mt Turbo", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 16384, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-05-07", - "last_updated": "2024-05-07", + "attachment": false, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-01", + "last_updated": "2025-01", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.16, + "output": 0.49 + } }, { - "id": "microsoft/phi-3-small-128k-instruct", - "name": "Phi 3 Small 128k Instruct", - "display_name": "Phi 3 Small 128k Instruct", + "id": "qwen3-coder-480b-a35b-instruct", + "name": "Qwen3-Coder 480B-A35B Instruct", + "display_name": "Qwen3-Coder 480B-A35B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-05-07", - "last_updated": "2024-05-07", + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 1.5, + "output": 7.5 + } }, { - "id": "microsoft/phi-3.5-vision-instruct", - "name": "Phi 3.5 Vision Instruct", - "display_name": "Phi 3.5 Vision Instruct", + "id": "qwen-mt-plus", + "name": "Qwen Mt Plus", + "display_name": "Qwen Mt Plus", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 16384, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2024-08-16", - "last_updated": "2024-08-16", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-01", + "last_updated": "2025-01", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 2.46, + "output": 7.37 + } }, { - "id": "microsoft/phi-3-small-8k-instruct", - "name": "Phi 3 Small 8k Instruct", - "display_name": "Phi 3 Small 8k Instruct", + "id": "qwen3-max", + "name": "Qwen3 Max", + "display_name": "Qwen3 Max", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 8000, - "output": 4096 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-05-07", - "last_updated": "2024-05-07", + "attachment": false, + "open_weights": false, + "knowledge": "2025-04", + "release_date": "2025-09-23", + "last_updated": "2025-09-23", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 1.2, + "output": 6 + } }, { - "id": "microsoft/phi-3.5-moe-instruct", - "name": "Phi 3.5 Moe Instruct", - "display_name": "Phi 3.5 Moe Instruct", + "id": "qwen3-coder-plus", + "name": "Qwen3 Coder Plus", + "display_name": "Qwen3 Coder Plus", "modalities": { "input": [ "text" @@ -5031,8 +5097,8 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 1000000, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -5041,23 +5107,21 @@ }, "attachment": false, "open_weights": true, - "release_date": "2024-08-17", - "last_updated": "2024-08-17", + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 1, + "output": 5 + } }, { - "id": "microsoft/phi-4-mini-instruct", - "name": "Phi-4-Mini", - "display_name": "Phi-4-Mini", + "id": "qwen3-next-80b-a3b-thinking", + "name": "Qwen3 Next 80B A3B Thinking", + "display_name": "Qwen3 Next 80B A3B Thinking", "modalities": { "input": [ - "text", - "image", - "audio" + "text" ], "output": [ "text" @@ -5065,62 +5129,71 @@ }, "limit": { "context": 131072, - "output": 8192 + "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, - "default": true + "default": true, + "budget": { + "default": 81920, + "min": 0, + "max": 81920 + } }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-12", - "release_date": "2024-12-01", - "last_updated": "2025-09-05", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-09", + "last_updated": "2025-09", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.5, + "output": 6 + } }, { - "id": "microsoft/phi-3-medium-4k-instruct", - "name": "Phi 3 Medium 4k Instruct", - "display_name": "Phi 3 Medium 4k Instruct", + "id": "qwen3-32b", + "name": "Qwen3 32B", + "display_name": "Qwen3 32B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 4000, - "output": 4096 + "context": 131072, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true, + "budget": { + "default": 38912, + "min": 0, + "max": 38912 + } }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-05-07", - "last_updated": "2024-05-07", + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.7, + "output": 2.8, + "reasoning": 8.4 + } }, { - "id": "microsoft/phi-3-vision-128k-instruct", - "name": "Phi 3 Vision 128k Instruct", - "display_name": "Phi 3 Vision 128k Instruct", + "id": "qwen-vl-plus", + "name": "Qwen-VL Plus", + "display_name": "Qwen-VL Plus", "modalities": { "input": [ "text", @@ -5131,8 +5204,8 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -5140,51 +5213,42 @@ "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2024-05-19", - "last_updated": "2024-05-19", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2024-01-25", + "last_updated": "2025-08-15", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.21, + "output": 0.63 + } }, { - "id": "openai/whisper-large-v3", - "name": "Whisper Large v3", - "display_name": "Whisper Large v3", + "id": "qwen3-coder-plus-2025-09-23", + "name": "Qwen3 Coder Plus 2025 09 23", + "display_name": "Qwen3 Coder Plus 2025 09 23", "modalities": { "input": [ - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 4096 + "context": 1000000, + "output": 65536 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-09", - "release_date": "2023-09-01", - "last_updated": "2025-09-05", - "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "attachment": false }, { - "id": "openai/gpt-oss-120b", - "name": "GPT-OSS-120B", - "display_name": "GPT-OSS-120B", + "id": "qwen3-coder-plus-2025-07-22", + "name": "Qwen3 Coder Plus 2025 07 22", + "display_name": "Qwen3 Coder Plus 2025 07 22", "modalities": { "input": [ "text" @@ -5194,93 +5258,74 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 1000000, + "output": 65536 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08", - "release_date": "2025-08-04", - "last_updated": "2025-08-14", - "cost": { - "input": 0, - "output": 0 + "supported": false }, - "type": "chat" + "attachment": false }, { - "id": "qwen/qwen3-next-80b-a3b-instruct", - "name": "Qwen3-Next-80B-A3B-Instruct", - "display_name": "Qwen3-Next-80B-A3B-Instruct", + "id": "qwen-vl-ocr-latest", + "name": "Qwen Vl Ocr Latest", + "display_name": "Qwen Vl Ocr Latest", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 34096, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-12", - "release_date": "2024-12-01", - "last_updated": "2025-09-05", - "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "attachment": false }, { - "id": "qwen/qwen2.5-coder-32b-instruct", - "name": "Qwen2.5 Coder 32b Instruct", - "display_name": "Qwen2.5 Coder 32b Instruct", + "id": "qvq-max-2025-05-15", + "name": "Qvq Max 2025 05 15", + "display_name": "Qvq Max 2025 05 15", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 131072, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "release_date": "2024-11-06", - "last_updated": "2024-11-06", - "cost": { - "input": 0, - "output": 0 + "supported": true, + "default": false, + "budget": { + "default": 16384, + "min": 0, + "max": 16384 + } }, - "type": "chat" + "attachment": false }, { - "id": "qwen/qwen2.5-coder-7b-instruct", - "name": "Qwen2.5 Coder 7b Instruct", - "display_name": "Qwen2.5 Coder 7b Instruct", + "id": "qwen-long", + "name": "Qwen Long", + "display_name": "Qwen Long", "modalities": { "input": [ "text" @@ -5290,28 +5335,20 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 1000000, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2024-09-17", - "last_updated": "2024-09-17", - "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "attachment": false }, { - "id": "qwen/qwen3-235b-a22b", - "name": "Qwen3-235B-A22B", - "display_name": "Qwen3-235B-A22B", + "id": "qwen-turbo-latest", + "name": "Qwen Turbo Latest", + "display_name": "Qwen Turbo Latest", "modalities": { "input": [ "text" @@ -5322,29 +5359,31 @@ }, "limit": { "context": 131072, - "output": 8192 + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false, + "budget": { + "default": 38912, + "min": 0, + "max": 38912 + } }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-12", - "release_date": "2024-12-01", - "last_updated": "2025-09-05", - "cost": { - "input": 0, - "output": 0 + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, - "type": "chat" + "attachment": false }, { - "id": "qwen/qwen3-coder-480b-a35b-instruct", - "name": "Qwen3 Coder 480B A35B Instruct", - "display_name": "Qwen3 Coder 480B A35B Instruct", + "id": "qwen-turbo-2024-09-19", + "name": "Qwen Turbo 2024 09 19", + "display_name": "Qwen Turbo 2024 09 19", "modalities": { "input": [ "text" @@ -5354,29 +5393,20 @@ ] }, "limit": { - "context": 262144, - "output": 66536 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-07-23", - "last_updated": "2025-07-23", - "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "attachment": false }, { - "id": "qwen/qwq-32b", - "name": "Qwq 32b", - "display_name": "Qwq 32b", + "id": "qwen-flash-2025-07-28", + "name": "Qwen Flash 2025 07 28", + "display_name": "Qwen Flash 2025 07 28", "modalities": { "input": [ "text" @@ -5386,29 +5416,32 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 1000000, + "output": 32768 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false, + "budget": { + "default": 81920, + "min": 0, + "max": 81920 + } }, - "attachment": false, - "open_weights": true, - "release_date": "2025-03-05", - "last_updated": "2025-03-05", - "cost": { - "input": 0, - "output": 0 + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, - "type": "chat" + "attachment": false }, { - "id": "qwen/qwen3-next-80b-a3b-thinking", - "name": "Qwen3-Next-80B-A3B-Thinking", - "display_name": "Qwen3-Next-80B-A3B-Thinking", + "id": "qwen-plus-latest", + "name": "Qwen Plus Latest", + "display_name": "Qwen Plus Latest", "modalities": { "input": [ "text" @@ -5418,30 +5451,32 @@ ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 1000000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false, + "budget": { + "default": 81920, + "min": 0, + "max": 81920 + } }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-12", - "release_date": "2024-12-01", - "last_updated": "2025-09-05", - "cost": { - "input": 0, - "output": 0 + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, - "type": "chat" + "attachment": false }, { - "id": "mistralai/devstral-2-123b-instruct-2512", - "name": "Devstral-2-123B-Instruct-2512", - "display_name": "Devstral-2-123B-Instruct-2512", + "id": "qwen-plus-2024-09-19", + "name": "Qwen Plus 2024 09 19", + "display_name": "Qwen Plus 2024 09 19", "modalities": { "input": [ "text" @@ -5451,96 +5486,90 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "attachment": true, - "open_weights": true, - "knowledge": "2025-12", - "release_date": "2025-12-08", - "last_updated": "2025-12-09", - "cost": { - "input": 0, - "output": 0 + "supported": false }, - "type": "chat" + "attachment": false }, { - "id": "mistralai/mistral-large-3-675b-instruct-2512", - "name": "Mistral Large 3 675B Instruct 2512", - "display_name": "Mistral Large 3 675B Instruct 2512", + "id": "qwen-plus-2025-07-14", + "name": "Qwen Plus 2025 07 14", + "display_name": "Qwen Plus 2025 07 14", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 131072, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false, + "budget": { + "default": 38912, + "min": 0, + "max": 38912 + } }, - "attachment": true, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2025-12-02", - "last_updated": "2025-12-02", - "cost": { - "input": 0, - "output": 0 + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, - "type": "chat" + "attachment": false }, { - "id": "mistralai/ministral-14b-instruct-2512", - "name": "Ministral 3 14B Instruct 2512", - "display_name": "Ministral 3 14B Instruct 2512", + "id": "qwen-plus-2025-09-11", + "name": "Qwen Plus 2025 09 11", + "display_name": "Qwen Plus 2025 09 11", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 1000000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false, + "budget": { + "default": 81920, + "min": 0, + "max": 81920 + } }, - "attachment": true, - "open_weights": true, - "knowledge": "2025-12", - "release_date": "2025-12-01", - "last_updated": "2025-12-08", - "cost": { - "input": 0, - "output": 0 + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, - "type": "chat" + "attachment": false }, { - "id": "mistralai/mamba-codestral-7b-v0.1", - "name": "Mamba Codestral 7b V0.1", - "display_name": "Mamba Codestral 7b V0.1", + "id": "qwen-max-latest", + "name": "Qwen Max Latest", + "display_name": "Qwen Max Latest", "modalities": { "input": [ "text" @@ -5550,28 +5579,26 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 131072, + "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2024-07-16", - "last_updated": "2024-07-16", - "cost": { - "input": 0, - "output": 0 + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, - "type": "chat" + "attachment": false }, { - "id": "mistralai/mistral-large-2-instruct", - "name": "Mistral Large 2 Instruct", - "display_name": "Mistral Large 2 Instruct", + "id": "qwen-max-2024-09-19", + "name": "Qwen Max 2024 09 19", + "display_name": "Qwen Max 2024 09 19", "modalities": { "input": [ "text" @@ -5581,28 +5608,26 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 32768, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2024-07-24", - "last_updated": "2024-07-24", - "cost": { - "input": 0, - "output": 0 + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, - "type": "chat" + "attachment": false }, { - "id": "mistralai/codestral-22b-instruct-v0.1", - "name": "Codestral 22b Instruct V0.1", - "display_name": "Codestral 22b Instruct V0.1", + "id": "qwen-max-2024-04-28", + "name": "Qwen Max 2024 04 28", + "display_name": "Qwen Max 2024 04 28", "modalities": { "input": [ "text" @@ -5612,28 +5637,20 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 8000, + "output": 2000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2024-05-29", - "last_updated": "2024-05-29", - "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "attachment": false }, { - "id": "mistralai/mistral-small-3.1-24b-instruct-2503", - "name": "Mistral Small 3.1 24b Instruct 2503", - "display_name": "Mistral Small 3.1 24b Instruct 2503", + "id": "qwen-max-2024-04-03", + "name": "Qwen Max 2024 04 03", + "display_name": "Qwen Max 2024 04 03", "modalities": { "input": [ "text" @@ -5643,61 +5660,49 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 8000, + "output": 2000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2025-03-11", - "last_updated": "2025-03-11", - "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "attachment": false }, { - "id": "meta/llama-3.2-11b-vision-instruct", - "name": "Llama 3.2 11b Vision Instruct", - "display_name": "Llama 3.2 11b Vision Instruct", + "id": "qwen-max-2025-01-25", + "name": "Qwen Max 2025 01 25", + "display_name": "Qwen Max 2025 01 25", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-09-18", - "last_updated": "2024-09-18", - "cost": { - "input": 0, - "output": 0 + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, - "type": "chat" + "attachment": false }, { - "id": "meta/llama3-70b-instruct", - "name": "Llama3 70b Instruct", - "display_name": "Llama3 70b Instruct", + "id": "qwen3-max-2025-09-23", + "name": "Qwen3 Max 20250923", + "display_name": "Qwen3 Max 20250923", "modalities": { "input": [ "text" @@ -5707,28 +5712,26 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2024-04-17", - "last_updated": "2024-04-17", - "cost": { - "input": 0, - "output": 0 + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, - "type": "chat" + "attachment": false }, { - "id": "meta/llama-3.3-70b-instruct", - "name": "Llama 3.3 70b Instruct", - "display_name": "Llama 3.3 70b Instruct", + "id": "qwen3-max-preview", + "name": "Qwen3 Max Preview", + "display_name": "Qwen3 Max Preview", "modalities": { "input": [ "text" @@ -5738,28 +5741,26 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2024-11-26", - "last_updated": "2024-11-26", - "cost": { - "input": 0, - "output": 0 + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, - "type": "chat" + "attachment": false }, { - "id": "meta/llama-3.2-1b-instruct", - "name": "Llama 3.2 1b Instruct", - "display_name": "Llama 3.2 1b Instruct", + "id": "qwen3-235b-a22b-thinking-2507", + "name": "Qwen3 235B A22B Thinking 2507", + "display_name": "Qwen3 235B A22B Thinking 2507", "modalities": { "input": [ "text" @@ -5769,95 +5770,72 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 131072, + "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-09-18", - "last_updated": "2024-09-18", - "cost": { - "input": 0, - "output": 0 + "supported": true, + "default": true, + "budget": { + "default": 81920, + "min": 0, + "max": 81920 + } }, - "type": "chat" + "attachment": false }, { - "id": "meta/llama-4-scout-17b-16e-instruct", - "name": "Llama 4 Scout 17b 16e Instruct", - "display_name": "Llama 4 Scout 17b 16e Instruct", + "id": "qwen3-235b-a22b-instruct-2507", + "name": "Qwen3 235B A22B Instruct 2507", + "display_name": "Qwen3 235B A22B Instruct 2507", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": true, - "knowledge": "2024-02", - "release_date": "2025-04-02", - "last_updated": "2025-04-02", - "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "attachment": false }, { - "id": "meta/llama-4-maverick-17b-128e-instruct", - "name": "Llama 4 Maverick 17b 128e Instruct", - "display_name": "Llama 4 Maverick 17b 128e Instruct", + "id": "qwen3-30b-a3b-instruct-2507", + "name": "Qwen3 30B A3B Instruct 2507", + "display_name": "Qwen3 30B A3B Instruct 2507", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": true, - "knowledge": "2024-02", - "release_date": "2025-04-01", - "last_updated": "2025-04-01", - "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "attachment": false }, { - "id": "meta/codellama-70b", - "name": "Codellama 70b", - "display_name": "Codellama 70b", + "id": "qwen3-30b-a3b-thinking-2507", + "name": "Qwen3 30B A3B Thinking 2507", + "display_name": "Qwen3 30B A3B Thinking 2507", "modalities": { "input": [ "text" @@ -5867,28 +5845,26 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": false, "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "release_date": "2024-01-29", - "last_updated": "2024-01-29", - "cost": { - "input": 0, - "output": 0 + "supported": true, + "default": true, + "budget": { + "default": 81920, + "min": 0, + "max": 81920 + } }, - "type": "chat" + "attachment": false }, { - "id": "meta/llama-3.1-405b-instruct", - "name": "Llama 3.1 405b Instruct", - "display_name": "Llama 3.1 405b Instruct", + "id": "qwen3-30b-a3b", + "name": "Qwen3 30B A3B", + "display_name": "Qwen3 30B A3B", "modalities": { "input": [ "text" @@ -5898,28 +5874,26 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "release_date": "2024-07-16", - "last_updated": "2024-07-16", - "cost": { - "input": 0, - "output": 0 + "supported": true, + "default": false, + "budget": { + "default": 81920, + "min": 0, + "max": 81920 + } }, - "type": "chat" + "attachment": false }, { - "id": "meta/llama3-8b-instruct", - "name": "Llama3 8b Instruct", - "display_name": "Llama3 8b Instruct", + "id": "qwen3-4b", + "name": "Qwen3 4B", + "display_name": "Qwen3 4B", "modalities": { "input": [ "text" @@ -5929,28 +5903,26 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "release_date": "2024-04-17", - "last_updated": "2024-04-17", - "cost": { - "input": 0, - "output": 0 + "supported": true, + "default": true, + "budget": { + "default": 38912, + "min": 0, + "max": 38912 + } }, - "type": "chat" + "attachment": false }, { - "id": "meta/llama-3.1-70b-instruct", - "name": "Llama 3.1 70b Instruct", - "display_name": "Llama 3.1 70b Instruct", + "id": "qwen3-1.7b", + "name": "Qwen3 1.7B", + "display_name": "Qwen3 1.7B", "modalities": { "input": [ "text" @@ -5960,28 +5932,26 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 32768, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "release_date": "2024-07-16", - "last_updated": "2024-07-16", - "cost": { - "input": 0, - "output": 0 + "supported": true, + "default": true, + "budget": { + "default": 30720, + "min": 0, + "max": 30720 + } }, - "type": "chat" + "attachment": false }, { - "id": "deepseek-ai/deepseek-r1-0528", - "name": "Deepseek R1 0528", - "display_name": "Deepseek R1 0528", + "id": "qwen3-0.6b", + "name": "Qwen3 0.6B", + "display_name": "Qwen3 0.6B", "modalities": { "input": [ "text" @@ -5991,61 +5961,56 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 32768, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true - }, - "attachment": false, - "open_weights": true, - "release_date": "2025-05-28", - "last_updated": "2025-05-28", - "cost": { - "input": 0, - "output": 0 + "default": true, + "budget": { + "default": 30720, + "min": 0, + "max": 30720 + } }, - "type": "chat" + "attachment": false }, { - "id": "deepseek-ai/deepseek-r1", - "name": "Deepseek R1", - "display_name": "Deepseek R1", + "id": "qwen3-vl-plus-2025-09-23", + "name": "Qwen3 VL Plus 2025 09 23", + "display_name": "Qwen3 VL Plus 2025 09 23", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 262144, + "output": 32768 }, "temperature": true, "tool_call": false, "reasoning": { "supported": true, - "default": true - }, - "attachment": false, - "open_weights": true, - "release_date": "2025-01-20", - "last_updated": "2025-01-20", - "cost": { - "input": 0, - "output": 0 + "default": false, + "budget": { + "default": 81920, + "min": 0, + "max": 81920 + } }, - "type": "chat" + "attachment": false }, { - "id": "deepseek-ai/deepseek-v3.1-terminus", - "name": "DeepSeek V3.1 Terminus", - "display_name": "DeepSeek V3.1 Terminus", + "id": "qwq-plus-latest", + "name": "QwQ Plus Latest", + "display_name": "QwQ Plus Latest", "modalities": { "input": [ "text" @@ -6055,63 +6020,70 @@ ] }, "limit": { - "context": 128000, + "context": 131072, "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, - "default": true + "default": true, + "budget": { + "default": 32768, + "min": 0, + "max": 32768 + } }, - "attachment": false, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-09-22", - "last_updated": "2025-09-22", - "cost": { - "input": 0, - "output": 0 + "search": { + "supported": false }, - "type": "chat" - }, + "attachment": false + } + ] + }, + "xai": { + "id": "xai", + "name": "xai", + "display_name": "xai", + "doc": "https://docs.x.ai/docs/models", + "models": [ { - "id": "deepseek-ai/deepseek-v3.1", - "name": "DeepSeek V3.1", - "display_name": "DeepSeek V3.1", + "id": "grok-4-fast-non-reasoning", + "name": "Grok 4 Fast (Non-Reasoning)", + "display_name": "Grok 4 Fast (Non-Reasoning)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 2000000, + "output": 30000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-07", - "release_date": "2025-08-20", - "last_updated": "2025-08-26", + "knowledge": "2025-07", + "release_date": "2025-09-19", + "last_updated": "2025-09-19", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.2, + "output": 0.5, + "cache_read": 0.05 + } }, { - "id": "deepseek-ai/deepseek-coder-6.7b-instruct", - "name": "Deepseek Coder 6.7b Instruct", - "display_name": "Deepseek Coder 6.7b Instruct", + "id": "grok-3-fast", + "name": "Grok 3 Fast", + "display_name": "Grok 3 Fast", "modalities": { "input": [ "text" @@ -6121,8 +6093,8 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -6130,91 +6102,87 @@ "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2023-10-29", - "last_updated": "2023-10-29", + "open_weights": false, + "knowledge": "2024-11", + "release_date": "2025-02-17", + "last_updated": "2025-02-17", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 5, + "output": 25, + "cache_read": 1.25 + } }, { - "id": "black-forest-labs/flux.1-dev", - "name": "FLUX.1-dev", - "display_name": "FLUX.1-dev", + "id": "grok-4", + "name": "Grok 4", + "display_name": "Grok 4", "modalities": { "input": [ "text" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 4096, - "output": 8192 + "context": 256000, + "output": 64000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "knowledge": "2024-08", - "release_date": "2024-08-01", - "last_updated": "2025-09-05", + "knowledge": "2025-07", + "release_date": "2025-07-09", + "last_updated": "2025-07-09", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" - } - ] - }, - "cohere": { - "id": "cohere", - "name": "Cohere", - "display_name": "Cohere", - "doc": "https://docs.cohere.com/docs/models", - "models": [ + "input": 3, + "output": 15, + "reasoning": 15, + "cache_read": 0.75 + } + }, { - "id": "command-a-translate-08-2025", - "name": "Command A Translate", - "display_name": "Command A Translate", + "id": "grok-2-vision", + "name": "Grok 2 Vision", + "display_name": "Grok 2 Vision", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8000, - "output": 8000 + "context": 8192, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-06-01", - "release_date": "2025-08-28", - "last_updated": "2025-08-28", + "attachment": true, + "open_weights": false, + "knowledge": "2024-08", + "release_date": "2024-08-20", + "last_updated": "2024-08-20", "cost": { - "input": 2.5, - "output": 10 - }, - "type": "chat" + "input": 2, + "output": 10, + "cache_read": 2 + } }, { - "id": "command-a-03-2025", - "name": "Command A", - "display_name": "Command A", + "id": "grok-code-fast-1", + "name": "Grok Code Fast 1", + "display_name": "Grok Code Fast 1", "modalities": { "input": [ "text" @@ -6225,7 +6193,7 @@ }, "limit": { "context": 256000, - "output": 8000 + "output": 10000 }, "temperature": true, "tool_call": true, @@ -6234,20 +6202,20 @@ "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2024-06-01", - "release_date": "2025-03-13", - "last_updated": "2025-03-13", + "open_weights": false, + "knowledge": "2023-10", + "release_date": "2025-08-28", + "last_updated": "2025-08-28", "cost": { - "input": 2.5, - "output": 10 - }, - "type": "chat" + "input": 0.2, + "output": 1.5, + "cache_read": 0.02 + } }, { - "id": "command-r-08-2024", - "name": "Command R", - "display_name": "Command R", + "id": "grok-2", + "name": "Grok 2", + "display_name": "Grok 2", "modalities": { "input": [ "text" @@ -6257,30 +6225,29 @@ ] }, "limit": { - "context": 128000, - "output": 4000 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-06-01", - "release_date": "2024-08-30", - "last_updated": "2024-08-30", + "open_weights": false, + "knowledge": "2024-08", + "release_date": "2024-08-20", + "last_updated": "2024-08-20", "cost": { - "input": 0.15, - "output": 0.6 - }, - "type": "chat" + "input": 2, + "output": 10, + "cache_read": 2 + } }, { - "id": "command-r-plus-08-2024", - "name": "Command R+", - "display_name": "Command R+", + "id": "grok-3-mini-fast-latest", + "name": "Grok 3 Mini Fast Latest", + "display_name": "Grok 3 Mini Fast Latest", "modalities": { "input": [ "text" @@ -6290,8 +6257,8 @@ ] }, "limit": { - "context": 128000, - "output": 4000 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -6300,52 +6267,57 @@ "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2024-06-01", - "release_date": "2024-08-30", - "last_updated": "2024-08-30", + "open_weights": false, + "knowledge": "2024-11", + "release_date": "2025-02-17", + "last_updated": "2025-02-17", "cost": { - "input": 2.5, - "output": 10 - }, - "type": "chat" + "input": 0.6, + "output": 4, + "reasoning": 4, + "cache_read": 0.15 + } }, { - "id": "command-r7b-12-2024", - "name": "Command R7B", - "display_name": "Command R7B", + "id": "grok-2-vision-1212", + "name": "Grok 2 Vision 1212", + "display_name": "Grok 2 Vision 1212", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4000 + "context": 32000, + "output": 32000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, + "search": { + "supported": false + }, "attachment": false, - "open_weights": true, - "knowledge": "2024-06-01", - "release_date": "2024-02-27", - "last_updated": "2024-02-27", + "open_weights": false, + "knowledge": "2024-08", + "release_date": "2024-08-20", + "last_updated": "2024-12-12", "cost": { - "input": 0.0375, - "output": 0.15 - }, - "type": "chat" + "input": 2, + "output": 10, + "cache_read": 2 + } }, { - "id": "command-a-reasoning-08-2025", - "name": "Command A Reasoning", - "display_name": "Command A Reasoning", + "id": "grok-3", + "name": "Grok 3", + "display_name": "Grok 3", "modalities": { "input": [ "text" @@ -6355,30 +6327,29 @@ ] }, "limit": { - "context": 256000, - "output": 32000 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-06-01", - "release_date": "2025-08-21", - "last_updated": "2025-08-21", + "open_weights": false, + "knowledge": "2024-11", + "release_date": "2025-02-17", + "last_updated": "2025-02-17", "cost": { - "input": 2.5, - "output": 10 - }, - "type": "chat" + "input": 3, + "output": 15, + "cache_read": 0.75 + } }, { - "id": "command-a-vision-07-2025", - "name": "Command A Vision", - "display_name": "Command A Vision", + "id": "grok-4-fast", + "name": "Grok 4 Fast", + "display_name": "Grok 4 Fast", "modalities": { "input": [ "text", @@ -6389,38 +6360,30 @@ ] }, "limit": { - "context": 128000, - "output": 8000 + "context": 2000000, + "output": 30000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-06-01", - "release_date": "2025-07-31", - "last_updated": "2025-07-31", + "attachment": true, + "open_weights": false, + "knowledge": "2025-07", + "release_date": "2025-09-19", + "last_updated": "2025-09-19", "cost": { - "input": 2.5, - "output": 10 - }, - "type": "chat" - } - ] - }, - "upstage": { - "id": "upstage", - "name": "Upstage", - "display_name": "Upstage", - "api": "https://api.upstage.ai", - "doc": "https://developers.upstage.ai/docs/apis/chat", - "models": [ + "input": 0.2, + "output": 0.5, + "cache_read": 0.05 + } + }, { - "id": "solar-mini", - "name": "solar-mini", - "display_name": "solar-mini", + "id": "grok-2-latest", + "name": "Grok 2 Latest", + "display_name": "Grok 2 Latest", "modalities": { "input": [ "text" @@ -6430,8 +6393,8 @@ ] }, "limit": { - "context": 32768, - "output": 4096 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -6440,30 +6403,31 @@ }, "attachment": false, "open_weights": false, - "knowledge": "2024-09", - "release_date": "2024-06-12", - "last_updated": "2025-04-22", + "knowledge": "2024-08", + "release_date": "2024-08-20", + "last_updated": "2024-12-12", "cost": { - "input": 0.15, - "output": 0.15 - }, - "type": "chat" + "input": 2, + "output": 10, + "cache_read": 2 + } }, { - "id": "solar-pro2", - "name": "solar-pro2", - "display_name": "solar-pro2", + "id": "grok-4-1-fast", + "name": "Grok 4.1 Fast", + "display_name": "Grok 4.1 Fast", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 65536, - "output": 8192 + "context": 2000000, + "output": 30000 }, "temperature": true, "tool_call": true, @@ -6471,29 +6435,21 @@ "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-03", - "release_date": "2025-05-20", - "last_updated": "2025-05-20", + "knowledge": "2025-07", + "release_date": "2025-11-19", + "last_updated": "2025-11-19", "cost": { - "input": 0.25, - "output": 0.25 - }, - "type": "chat" - } - ] - }, - "groq": { - "id": "groq", - "name": "Groq", - "display_name": "Groq", - "doc": "https://console.groq.com/docs/models", - "models": [ + "input": 0.2, + "output": 0.5, + "cache_read": 0.05 + } + }, { - "id": "llama-3.1-8b-instant", - "name": "Llama 3.1 8B Instant", - "display_name": "Llama 3.1 8B Instant", + "id": "grok-2-1212", + "name": "Grok 2 1212", + "display_name": "Grok 2 1212", "modalities": { "input": [ "text" @@ -6503,29 +6459,32 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 120000, + "output": 100000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, + "search": { + "supported": false + }, "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "open_weights": false, + "knowledge": "2024-08", + "release_date": "2024-12-12", + "last_updated": "2024-12-12", "cost": { - "input": 0.05, - "output": 0.08 - }, - "type": "chat" + "input": 2, + "output": 10, + "cache_read": 2 + } }, { - "id": "mistral-saba-24b", - "name": "Mistral Saba 24B", - "display_name": "Mistral Saba 24B", + "id": "grok-3-fast-latest", + "name": "Grok 3 Fast Latest", + "display_name": "Grok 3 Fast Latest", "modalities": { "input": [ "text" @@ -6535,8 +6494,8 @@ ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -6545,19 +6504,19 @@ }, "attachment": false, "open_weights": false, - "knowledge": "2024-08", - "release_date": "2025-02-06", - "last_updated": "2025-02-06", + "knowledge": "2024-11", + "release_date": "2025-02-17", + "last_updated": "2025-02-17", "cost": { - "input": 0.79, - "output": 0.79 - }, - "type": "chat" + "input": 5, + "output": 25, + "cache_read": 1.25 + } }, { - "id": "llama3-8b-8192", - "name": "Llama 3 8B", - "display_name": "Llama 3 8B", + "id": "grok-3-latest", + "name": "Grok 3 Latest", + "display_name": "Grok 3 Latest", "modalities": { "input": [ "text" @@ -6567,7 +6526,7 @@ ] }, "limit": { - "context": 8192, + "context": 131072, "output": 8192 }, "temperature": true, @@ -6576,56 +6535,57 @@ "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2023-03", - "release_date": "2024-04-18", - "last_updated": "2024-04-18", + "open_weights": false, + "knowledge": "2024-11", + "release_date": "2025-02-17", + "last_updated": "2025-02-17", "cost": { - "input": 0.05, - "output": 0.08 - }, - "type": "chat" + "input": 3, + "output": 15, + "cache_read": 0.75 + } }, { - "id": "qwen-qwq-32b", - "name": "Qwen QwQ 32B", - "display_name": "Qwen QwQ 32B", + "id": "grok-2-vision-latest", + "name": "Grok 2 Vision Latest", + "display_name": "Grok 2 Vision Latest", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 8192, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-09", - "release_date": "2024-11-27", - "last_updated": "2024-11-27", + "attachment": true, + "open_weights": false, + "knowledge": "2024-08", + "release_date": "2024-08-20", + "last_updated": "2024-12-12", "cost": { - "input": 0.29, - "output": 0.39 - }, - "type": "chat" + "input": 2, + "output": 10, + "cache_read": 2 + } }, { - "id": "llama3-70b-8192", - "name": "Llama 3 70B", - "display_name": "Llama 3 70B", + "id": "grok-vision-beta", + "name": "Grok Vision Beta", + "display_name": "Grok Vision Beta", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -6633,28 +6593,28 @@ }, "limit": { "context": 8192, - "output": 8192 + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-03", - "release_date": "2024-04-18", - "last_updated": "2024-04-18", + "attachment": true, + "open_weights": false, + "knowledge": "2024-08", + "release_date": "2024-11-01", + "last_updated": "2024-11-01", "cost": { - "input": 0.59, - "output": 0.79 - }, - "type": "chat" + "input": 5, + "output": 15, + "cache_read": 5 + } }, { - "id": "deepseek-r1-distill-llama-70b", - "name": "DeepSeek R1 Distill Llama 70B", - "display_name": "DeepSeek R1 Distill Llama 70B", + "id": "grok-3-mini", + "name": "Grok 3 Mini", + "display_name": "Grok 3 Mini", "modalities": { "input": [ "text" @@ -6674,20 +6634,21 @@ "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-01-20", - "last_updated": "2025-01-20", + "open_weights": false, + "knowledge": "2024-11", + "release_date": "2025-02-17", + "last_updated": "2025-02-17", "cost": { - "input": 0.75, - "output": 0.99 - }, - "type": "chat" + "input": 0.3, + "output": 0.5, + "reasoning": 0.5, + "cache_read": 0.075 + } }, { - "id": "llama-guard-3-8b", - "name": "Llama Guard 3 8B", - "display_name": "Llama Guard 3 8B", + "id": "grok-beta", + "name": "Grok Beta", + "display_name": "Grok Beta", "modalities": { "input": [ "text" @@ -6697,28 +6658,29 @@ ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 131072, + "output": 4096 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "open_weights": false, + "knowledge": "2024-08", + "release_date": "2024-11-01", + "last_updated": "2024-11-01", "cost": { - "input": 0.2, - "output": 0.2 - }, - "type": "chat" + "input": 5, + "output": 15, + "cache_read": 5 + } }, { - "id": "gemma2-9b-it", - "name": "Gemma 2 9B", - "display_name": "Gemma 2 9B", + "id": "grok-3-mini-latest", + "name": "Grok 3 Mini Latest", + "display_name": "Grok 3 Mini Latest", "modalities": { "input": [ "text" @@ -6728,61 +6690,64 @@ ] }, "limit": { - "context": 8192, + "context": 131072, "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2024-06", - "release_date": "2024-06-27", - "last_updated": "2024-06-27", + "open_weights": false, + "knowledge": "2024-11", + "release_date": "2025-02-17", + "last_updated": "2025-02-17", "cost": { - "input": 0.2, - "output": 0.2 - }, - "type": "chat" + "input": 0.3, + "output": 0.5, + "reasoning": 0.5, + "cache_read": 0.075 + } }, { - "id": "llama-3.3-70b-versatile", - "name": "Llama 3.3 70B Versatile", - "display_name": "Llama 3.3 70B Versatile", + "id": "grok-4-1-fast-non-reasoning", + "name": "Grok 4.1 Fast (Non-Reasoning)", + "display_name": "Grok 4.1 Fast (Non-Reasoning)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 2000000, + "output": 30000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "attachment": true, + "open_weights": false, + "knowledge": "2025-07", + "release_date": "2025-11-19", + "last_updated": "2025-11-19", "cost": { - "input": 0.59, - "output": 0.79 - }, - "type": "chat" + "input": 0.2, + "output": 0.5, + "cache_read": 0.05 + } }, { - "id": "moonshotai/kimi-k2-instruct-0905", - "name": "Kimi K2 Instruct 0905", - "display_name": "Kimi K2 Instruct 0905", + "id": "grok-3-mini-fast", + "name": "Grok 3 Mini Fast", + "display_name": "Grok 3 Mini Fast", "modalities": { "input": [ "text" @@ -6792,29 +6757,31 @@ ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-09-05", - "last_updated": "2025-09-05", + "open_weights": false, + "knowledge": "2024-11", + "release_date": "2025-02-17", + "last_updated": "2025-02-17", "cost": { - "input": 1, - "output": 3 - }, - "type": "chat" + "input": 0.6, + "output": 4, + "reasoning": 4, + "cache_read": 0.15 + } }, { - "id": "moonshotai/kimi-k2-instruct", - "name": "Kimi K2 Instruct", - "display_name": "Kimi K2 Instruct", + "id": "grok-3-mini-fast-beta", + "name": "Grok 3 Mini Fast Beta", + "display_name": "Grok 3 Mini Fast Beta", "modalities": { "input": [ "text" @@ -6824,29 +6791,25 @@ ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 120000, + "output": 100000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true, + "effort": "low" }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-07-14", - "last_updated": "2025-07-14", - "cost": { - "input": 1, - "output": 3 + "search": { + "supported": false }, - "type": "chat" + "attachment": false }, { - "id": "openai/gpt-oss-20b", - "name": "GPT OSS 20B", - "display_name": "GPT OSS 20B", + "id": "grok-3-mini-beta", + "name": "Grok 3 Mini Beta", + "display_name": "Grok 3 Mini Beta", "modalities": { "input": [ "text" @@ -6856,29 +6819,25 @@ ] }, "limit": { - "context": 131072, - "output": 65536 + "context": 120000, + "output": 100000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": true, + "effort": "low" }, - "attachment": false, - "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", - "cost": { - "input": 0.075, - "output": 0.3 + "search": { + "supported": false }, - "type": "chat" + "attachment": false }, { - "id": "openai/gpt-oss-120b", - "name": "GPT OSS 120B", - "display_name": "GPT OSS 120B", + "id": "grok-3-fast-beta", + "name": "Grok 3 Fast Beta", + "display_name": "Grok 3 Fast Beta", "modalities": { "input": [ "text" @@ -6888,169 +6847,148 @@ ] }, "limit": { - "context": 131072, - "output": 65536 + "context": 120000, + "output": 100000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", - "cost": { - "input": 0.15, - "output": 0.6 + "search": { + "supported": false }, - "type": "chat" + "attachment": false }, { - "id": "qwen/qwen3-32b", - "name": "Qwen3 32B", - "display_name": "Qwen3 32B", + "id": "grok-2-image-1212", + "name": "Grok 2 Image 1212", + "display_name": "Grok 2 Image 1212", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 130000, + "output": 100000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-11-08", - "release_date": "2024-12-23", - "last_updated": "2024-12-23", - "cost": { - "input": 0.29, - "output": 0.59 + "search": { + "supported": false }, - "type": "chat" + "attachment": false }, { - "id": "meta-llama/llama-4-scout-17b-16e-instruct", - "name": "Llama 4 Scout 17B", - "display_name": "Llama 4 Scout 17B", + "id": "grok-3-beta", + "name": "Grok 3 Beta", + "display_name": "Grok 3 Beta", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 120000, + "output": 100000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", - "cost": { - "input": 0.11, - "output": 0.34 + "search": { + "supported": false }, - "type": "chat" - }, + "attachment": false + } + ] + }, + "vultr": { + "id": "vultr", + "name": "Vultr", + "display_name": "Vultr", + "api": "https://api.vultrinference.com/v1", + "doc": "https://api.vultrinference.com/", + "models": [ { - "id": "meta-llama/llama-4-maverick-17b-128e-instruct", - "name": "Llama 4 Maverick 17B", - "display_name": "Llama 4 Maverick 17B", + "id": "deepseek-r1-distill-qwen-32b", + "name": "DeepSeek R1 Distill Qwen 32B", + "display_name": "DeepSeek R1 Distill Qwen 32B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 131072, + "context": 121808, "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "knowledge": "2024-10", + "release_date": "2025-01-20", + "last_updated": "2025-01-20", "cost": { "input": 0.2, - "output": 0.6 - }, - "type": "chat" + "output": 0.2 + } }, { - "id": "meta-llama/llama-guard-4-12b", - "name": "Llama Guard 4 12B", - "display_name": "Llama Guard 4 12B", + "id": "qwen2.5-coder-32b-instruct", + "name": "Qwen2.5 Coder 32B Instruct", + "display_name": "Qwen2.5 Coder 32B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 1024 + "context": 12952, + "output": 2048 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "knowledge": "2024-10", + "release_date": "2024-11-06", + "last_updated": "2024-11-06", "cost": { "input": 0.2, "output": 0.2 - }, - "type": "chat" - } - ] - }, - "bailing": { - "id": "bailing", - "name": "Bailing", - "display_name": "Bailing", - "api": "https://api.tbox.cn/api/llm/v1/chat/completions", - "doc": "https://alipaytbox.yuque.com/sxs0ba/ling/intro", - "models": [ + } + }, { - "id": "Ling-1T", - "name": "Ling-1T", - "display_name": "Ling-1T", + "id": "kimi-k2-instruct", + "name": "Kimi K2 Instruct", + "display_name": "Kimi K2 Instruct", "modalities": { "input": [ "text" @@ -7060,8 +6998,8 @@ ] }, "limit": { - "context": 128000, - "output": 32000 + "context": 58904, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -7070,19 +7008,18 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-06", - "release_date": "2025-10", - "last_updated": "2025-10", + "knowledge": "2024-10", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", "cost": { - "input": 0.57, - "output": 2.29 - }, - "type": "chat" + "input": 0.2, + "output": 0.2 + } }, { - "id": "Ring-1T", - "name": "Ring-1T", - "display_name": "Ring-1T", + "id": "deepseek-r1-distill-llama-70b", + "name": "DeepSeek R1 Distill Llama 70B", + "display_name": "DeepSeek R1 Distill Llama 70B", "modalities": { "input": [ "text" @@ -7092,52 +7029,39 @@ ] }, "limit": { - "context": 128000, - "output": 32000 + "context": 121808, + "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, "attachment": false, "open_weights": true, - "knowledge": "2024-06", - "release_date": "2025-10", - "last_updated": "2025-10", + "knowledge": "2024-10", + "release_date": "2025-01-20", + "last_updated": "2025-01-20", "cost": { - "input": 0.57, - "output": 2.29 - }, - "type": "chat" - } - ] - }, - "github-copilot": { - "id": "github-copilot", - "name": "GitHub Copilot", - "display_name": "GitHub Copilot", - "api": "https://api.githubcopilot.com", - "doc": "https://docs.github.com/en/copilot", - "models": [ + "input": 0.2, + "output": 0.2 + } + }, { - "id": "gemini-2.0-flash-001", - "name": "Gemini 2.0 Flash", - "display_name": "Gemini 2.0 Flash", + "id": "gpt-oss-120b", + "name": "GPT OSS 120B", + "display_name": "GPT OSS 120B", "modalities": { "input": [ - "text", - "image", - "audio", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, + "context": 121808, "output": 8192 }, "temperature": true, @@ -7145,91 +7069,94 @@ "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-06", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "attachment": false, + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2025-06-23", + "last_updated": "2025-06-23", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" - }, + "input": 0.2, + "output": 0.2 + } + } + ] + }, + "nvidia": { + "id": "nvidia", + "name": "Nvidia", + "display_name": "Nvidia", + "api": "https://integrate.api.nvidia.com/v1", + "doc": "https://docs.api.nvidia.com/nim/", + "models": [ { - "id": "claude-opus-4", - "name": "Claude Opus 4", - "display_name": "Claude Opus 4", + "id": "moonshotai/kimi-k2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 80000, - "output": 16000 + "context": 262144, + "output": 262144 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true }, "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "open_weights": true, + "knowledge": "2025-07", + "release_date": "2026-01-27", + "last_updated": "2026-01-27", "cost": { "input": 0, "output": 0 - }, - "type": "chat" + } }, { - "id": "gemini-3-flash-preview", - "name": "Gemini 3 Flash", - "display_name": "Gemini 3 Flash", + "id": "moonshotai/kimi-k2-instruct-0905", + "name": "Kimi K2 0905", + "display_name": "Kimi K2 0905", "modalities": { "input": [ - "text", - "image", - "audio", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 64000 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-12-17", - "last_updated": "2025-12-17", + "attachment": false, + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", "cost": { "input": 0, "output": 0 - }, - "type": "chat" + } }, { - "id": "grok-code-fast-1", - "name": "Grok Code Fast 1", - "display_name": "Grok Code Fast 1", + "id": "moonshotai/kimi-k2-thinking", + "name": "Kimi K2 Thinking", + "display_name": "Kimi K2 Thinking", "modalities": { "input": [ "text" @@ -7239,8 +7166,8 @@ ] }, "limit": { - "context": 128000, - "output": 64000 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -7249,24 +7176,24 @@ "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2025-08", - "release_date": "2025-08-27", - "last_updated": "2025-08-27", + "open_weights": true, + "knowledge": "2025-07", + "release_date": "2025-11", + "last_updated": "2025-12", "cost": { "input": 0, - "output": 0 - }, - "type": "chat" + "output": 0, + "cache_read": 0, + "cache_write": 0 + } }, { - "id": "gpt-5.1-codex", - "name": "GPT-5.1-Codex", - "display_name": "GPT-5.1-Codex", + "id": "moonshotai/kimi-k2-instruct", + "name": "Kimi K2 Instruct", + "display_name": "Kimi K2 Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -7274,9 +7201,9 @@ }, "limit": { "context": 128000, - "output": 128000 + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -7284,31 +7211,29 @@ }, "attachment": false, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "knowledge": "2024-01", + "release_date": "2025-01-01", + "last_updated": "2025-09-05", "cost": { "input": 0, "output": 0 - }, - "type": "chat" + } }, { - "id": "claude-haiku-4.5", - "name": "Claude Haiku 4.5", - "display_name": "Claude Haiku 4.5", + "id": "nvidia/nvidia-nemotron-nano-9b-v2", + "name": "nvidia-nemotron-nano-9b-v2", + "display_name": "nvidia-nemotron-nano-9b-v2", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16000 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -7316,26 +7241,24 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-02-28", - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "attachment": false, + "open_weights": true, + "knowledge": "2024-09", + "release_date": "2025-08-18", + "last_updated": "2025-08-18", "cost": { "input": 0, "output": 0 - }, - "type": "chat" + } }, { - "id": "gemini-3-pro-preview", - "name": "Gemini 3 Pro Preview", - "display_name": "Gemini 3 Pro Preview", + "id": "nvidia/cosmos-nemotron-34b", + "name": "Cosmos Nemotron 34B", + "display_name": "Cosmos Nemotron 34B", "modalities": { "input": [ "text", "image", - "audio", "video" ], "output": [ @@ -7343,168 +7266,157 @@ ] }, "limit": { - "context": 128000, - "output": 64000 + "context": 131072, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-11-18", - "last_updated": "2025-11-18", + "knowledge": "2024-01", + "release_date": "2024-01-01", + "last_updated": "2025-09-05", "cost": { "input": 0, "output": 0 - }, - "type": "chat" + } }, { - "id": "oswe-vscode-prime", - "name": "Raptor Mini (Preview)", - "display_name": "Raptor Mini (Preview)", + "id": "nvidia/llama-embed-nemotron-8b", + "name": "Llama Embed Nemotron 8B", + "display_name": "Llama Embed Nemotron 8B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 32768, + "output": 2048 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-11-10", - "last_updated": "2025-11-10", + "knowledge": "2025-03", + "release_date": "2025-03-18", + "last_updated": "2025-03-18", "cost": { "input": 0, "output": 0 - }, - "type": "chat" + } }, { - "id": "claude-3.5-sonnet", - "name": "Claude Sonnet 3.5", - "display_name": "Claude Sonnet 3.5", + "id": "nvidia/nemotron-3-nano-30b-a3b", + "name": "nemotron-3-nano-30b-a3b", + "display_name": "nemotron-3-nano-30b-a3b", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 90000, - "output": 8192 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-10-22", - "last_updated": "2024-10-22", + "attachment": false, + "open_weights": true, + "knowledge": "2024-09", + "release_date": "2024-12", + "last_updated": "2024-12", "cost": { "input": 0, "output": 0 - }, - "type": "chat" + } }, { - "id": "gpt-5.1-codex-mini", - "name": "GPT-5.1-Codex-mini", - "display_name": "GPT-5.1-Codex-mini", + "id": "nvidia/parakeet-tdt-0.6b-v2", + "name": "Parakeet TDT 0.6B v2", + "display_name": "Parakeet TDT 0.6B v2", "modalities": { "input": [ - "text", - "image" + "audio" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 100000 + "context": 0, + "output": 4096 }, "temperature": false, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "knowledge": "2024-01", + "release_date": "2024-01-01", + "last_updated": "2025-09-05", "cost": { "input": 0, "output": 0 - }, - "type": "chat" + } }, { - "id": "o3-mini", - "name": "o3-mini", - "display_name": "o3-mini", + "id": "nvidia/nemoretriever-ocr-v1", + "name": "NeMo Retriever OCR v1", + "display_name": "NeMo Retriever OCR v1", "modalities": { "input": [ - "text" + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 65536 + "context": 0, + "output": 4096 }, "temperature": false, "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-12-20", - "last_updated": "2025-01-29", + "knowledge": "2024-01", + "release_date": "2024-01-01", + "last_updated": "2025-09-05", "cost": { "input": 0, "output": 0 - }, - "type": "chat" + } }, { - "id": "gpt-5.1", - "name": "GPT-5.1", - "display_name": "GPT-5.1", + "id": "nvidia/llama-3.3-nemotron-super-49b-v1", + "name": "Llama 3.3 Nemotron Super 49b V1", + "display_name": "Llama 3.3 Nemotron Super 49b V1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -7512,33 +7424,29 @@ }, "limit": { "context": 128000, - "output": 128000 + "output": 4096 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "release_date": "2025-03-16", + "last_updated": "2025-03-16", "cost": { "input": 0, "output": 0 - }, - "type": "chat" + } }, { - "id": "gpt-5-codex", - "name": "GPT-5-Codex", - "display_name": "GPT-5-Codex", + "id": "nvidia/llama-3.1-nemotron-51b-instruct", + "name": "Llama 3.1 Nemotron 51b Instruct", + "display_name": "Llama 3.1 Nemotron 51b Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -7546,66 +7454,91 @@ }, "limit": { "context": 128000, - "output": 128000 + "output": 4096 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-09-15", - "last_updated": "2025-09-15", + "release_date": "2024-09-22", + "last_updated": "2024-09-22", "cost": { "input": 0, "output": 0 - }, - "type": "chat" + } }, { - "id": "gpt-4o", - "name": "GPT-4o", - "display_name": "GPT-4o", + "id": "nvidia/llama3-chatqa-1.5-70b", + "name": "Llama3 Chatqa 1.5 70b", + "display_name": "Llama3 Chatqa 1.5 70b", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 64000, - "output": 16384 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-05-13", - "last_updated": "2024-05-13", + "release_date": "2024-04-28", + "last_updated": "2024-04-28", "cost": { "input": 0, "output": 0 + } + }, + { + "id": "nvidia/llama-3.1-nemotron-ultra-253b-v1", + "name": "Llama-3.1-Nemotron-Ultra-253B-v1", + "display_name": "Llama-3.1-Nemotron-Ultra-253B-v1", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] }, - "type": "chat" + "limit": { + "context": 131072, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": false, + "knowledge": "2024-07", + "release_date": "2024-07-01", + "last_updated": "2025-09-05", + "cost": { + "input": 0, + "output": 0 + } }, { - "id": "gpt-4.1", - "name": "GPT-4.1", - "display_name": "GPT-4.1", + "id": "nvidia/llama-3.1-nemotron-70b-instruct", + "name": "Llama 3.1 Nemotron 70b Instruct", + "display_name": "Llama 3.1 Nemotron 70b Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -7613,28 +7546,26 @@ }, "limit": { "context": 128000, - "output": 16384 + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "release_date": "2024-10-12", + "last_updated": "2024-10-12", "cost": { "input": 0, "output": 0 - }, - "type": "chat" + } }, { - "id": "o4-mini", - "name": "o4-mini (Preview)", - "display_name": "o4-mini (Preview)", + "id": "nvidia/nemotron-4-340b-instruct", + "name": "Nemotron 4 340b Instruct", + "display_name": "Nemotron 4 340b Instruct", "modalities": { "input": [ "text" @@ -7645,67 +7576,59 @@ }, "limit": { "context": 128000, - "output": 65536 + "output": 4096 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "release_date": "2024-06-13", + "last_updated": "2024-06-13", "cost": { "input": 0, "output": 0 - }, - "type": "chat" + } }, { - "id": "claude-opus-41", - "name": "Claude Opus 4.1", - "display_name": "Claude Opus 4.1", + "id": "nvidia/llama-3.3-nemotron-super-49b-v1.5", + "name": "Llama 3.3 Nemotron Super 49b V1.5", + "display_name": "Llama 3.3 Nemotron Super 49b V1.5", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 80000, - "output": 16000 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "release_date": "2025-03-16", + "last_updated": "2025-03-16", "cost": { "input": 0, "output": 0 - }, - "type": "chat" + } }, { - "id": "gpt-5-mini", - "name": "GPT-5-mini", - "display_name": "GPT-5-mini", + "id": "minimaxai/minimax-m2", + "name": "MiniMax-M2", + "display_name": "MiniMax-M2", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -7713,7 +7636,7 @@ }, "limit": { "context": 128000, - "output": 64000 + "output": 16384 }, "temperature": true, "tool_call": true, @@ -7721,60 +7644,55 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-06", - "release_date": "2025-08-13", - "last_updated": "2025-08-13", + "attachment": false, + "open_weights": true, + "knowledge": "2024-07", + "release_date": "2025-10-27", + "last_updated": "2025-10-31", "cost": { "input": 0, "output": 0 - }, - "type": "chat" + } }, { - "id": "claude-3.7-sonnet", - "name": "Claude Sonnet 3.7", - "display_name": "Claude Sonnet 3.7", + "id": "minimaxai/minimax-m2.1", + "name": "MiniMax-M2.1", + "display_name": "MiniMax-M2.1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 16384 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-02-19", - "last_updated": "2025-02-19", + "attachment": false, + "open_weights": true, + "release_date": "2025-12-23", + "last_updated": "2025-12-23", "cost": { "input": 0, "output": 0 - }, - "type": "chat" + } }, { - "id": "gemini-2.5-pro", - "name": "Gemini 2.5 Pro", - "display_name": "Gemini 2.5 Pro", + "id": "google/gemma-3n-e2b-it", + "name": "Gemma 3n E2b It", + "display_name": "Gemma 3n E2b It", "modalities": { "input": [ "text", - "image", - "audio", - "video" + "image" ], "output": [ "text" @@ -7782,7 +7700,7 @@ }, "limit": { "context": 128000, - "output": 64000 + "output": 4096 }, "temperature": true, "tool_call": true, @@ -7790,24 +7708,22 @@ "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-03-20", - "last_updated": "2025-06-05", + "open_weights": true, + "knowledge": "2024-06", + "release_date": "2025-06-12", + "last_updated": "2025-06-12", "cost": { "input": 0, "output": 0 - }, - "type": "chat" + } }, { - "id": "gpt-5.1-codex-max", - "name": "GPT-5.1-Codex-max", - "display_name": "GPT-5.1-Codex-max", + "id": "google/codegemma-1.1-7b", + "name": "Codegemma 1.1 7b", + "display_name": "Codegemma 1.1 7b", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -7815,29 +7731,26 @@ }, "limit": { "context": 128000, - "output": 128000 + "output": 4096 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-12-04", - "last_updated": "2025-12-04", + "attachment": false, + "open_weights": true, + "release_date": "2024-04-30", + "last_updated": "2024-04-30", "cost": { "input": 0, "output": 0 - }, - "type": "chat" + } }, { - "id": "o3", - "name": "o3 (Preview)", - "display_name": "o3 (Preview)", + "id": "google/gemma-3n-e4b-it", + "name": "Gemma 3n E4b It", + "display_name": "Gemma 3n E4b It", "modalities": { "input": [ "text", @@ -7849,33 +7762,30 @@ }, "limit": { "context": 128000, - "output": 16384 + "output": 4096 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2024-05", - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "open_weights": true, + "knowledge": "2024-06", + "release_date": "2025-06-03", + "last_updated": "2025-06-03", "cost": { "input": 0, "output": 0 - }, - "type": "chat" + } }, { - "id": "claude-sonnet-4", - "name": "Claude Sonnet 4", - "display_name": "Claude Sonnet 4", + "id": "google/gemma-2-2b-it", + "name": "Gemma 2 2b It", + "display_name": "Gemma 2 2b It", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -7883,33 +7793,29 @@ }, "limit": { "context": 128000, - "output": 16000 + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "attachment": false, + "open_weights": true, + "release_date": "2024-07-16", + "last_updated": "2024-07-16", "cost": { "input": 0, "output": 0 - }, - "type": "chat" + } }, { - "id": "gpt-5", - "name": "GPT-5", - "display_name": "GPT-5", + "id": "google/gemma-3-12b-it", + "name": "Gemma 3 12b It", + "display_name": "Gemma 3 12b It", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -7917,63 +7823,56 @@ }, "limit": { "context": 128000, - "output": 128000 + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "attachment": false, + "open_weights": true, + "release_date": "2025-03-01", + "last_updated": "2025-03-01", "cost": { "input": 0, "output": 0 - }, - "type": "chat" + } }, { - "id": "claude-3.7-sonnet-thought", - "name": "Claude Sonnet 3.7 Thinking", - "display_name": "Claude Sonnet 3.7 Thinking", + "id": "google/codegemma-7b", + "name": "Codegemma 7b", + "display_name": "Codegemma 7b", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 16384 + "context": 128000, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-02-19", - "last_updated": "2025-02-19", + "attachment": false, + "open_weights": true, + "release_date": "2024-03-21", + "last_updated": "2024-03-21", "cost": { "input": 0, "output": 0 - }, - "type": "chat" + } }, { - "id": "claude-opus-4.5", - "name": "Claude Opus 4.5", - "display_name": "Claude Opus 4.5", + "id": "google/gemma-3-1b-it", + "name": "Gemma 3 1b It", + "display_name": "Gemma 3 1b It", "modalities": { "input": [ "text", @@ -7985,33 +7884,29 @@ }, "limit": { "context": 128000, - "output": 16000 + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-11-24", - "last_updated": "2025-08-01", + "open_weights": true, + "release_date": "2025-03-10", + "last_updated": "2025-03-10", "cost": { "input": 0, "output": 0 - }, - "type": "chat" + } }, { - "id": "gpt-5.2", - "name": "GPT-5.2", - "display_name": "GPT-5.2", + "id": "google/gemma-2-27b-it", + "name": "Gemma 2 27b It", + "display_name": "Gemma 2 27b It", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -8019,29 +7914,26 @@ }, "limit": { "context": 128000, - "output": 64000 + "output": 4096 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "attachment": false, + "open_weights": true, + "release_date": "2024-06-24", + "last_updated": "2024-06-24", "cost": { "input": 0, "output": 0 - }, - "type": "chat" + } }, { - "id": "claude-sonnet-4.5", - "name": "Claude Sonnet 4.5", - "display_name": "Claude Sonnet 4.5", + "id": "google/gemma-3-27b-it", + "name": "Gemma-3-27B-IT", + "display_name": "Gemma-3-27B-IT", "modalities": { "input": [ "text", @@ -8052,8 +7944,8 @@ ] }, "limit": { - "context": 128000, - "output": 16000 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -8063,30 +7955,22 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "knowledge": "2024-12", + "release_date": "2024-12-01", + "last_updated": "2025-09-05", "cost": { "input": 0, "output": 0 - }, - "type": "chat" - } - ] - }, - "mistral": { - "id": "mistral", - "name": "Mistral", - "display_name": "Mistral", - "doc": "https://docs.mistral.ai/getting-started/models/", - "models": [ + } + }, { - "id": "devstral-medium-2507", - "name": "Devstral Medium", - "display_name": "Devstral Medium", + "id": "microsoft/phi-3-medium-128k-instruct", + "name": "Phi 3 Medium 128k Instruct", + "display_name": "Phi 3 Medium 128k Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -8094,28 +7978,27 @@ }, "limit": { "context": 128000, - "output": 128000 + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2025-05", - "release_date": "2025-07-10", - "last_updated": "2025-07-10", + "knowledge": "2023-10", + "release_date": "2024-05-07", + "last_updated": "2024-05-07", "cost": { - "input": 0.4, - "output": 2 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "mistral-large-2512", - "name": "Mistral Large 3", - "display_name": "Mistral Large 3", + "id": "microsoft/phi-3-small-128k-instruct", + "name": "Phi 3 Small 128k Instruct", + "display_name": "Phi 3 Small 128k Instruct", "modalities": { "input": [ "text", @@ -8126,8 +8009,8 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -8136,30 +8019,30 @@ }, "attachment": true, "open_weights": true, - "knowledge": "2024-11", - "release_date": "2024-11-01", - "last_updated": "2025-12-02", + "knowledge": "2023-10", + "release_date": "2024-05-07", + "last_updated": "2024-05-07", "cost": { - "input": 0.5, - "output": 1.5 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "open-mixtral-8x22b", - "name": "Mixtral 8x22B", - "display_name": "Mixtral 8x22B", + "id": "microsoft/phi-3.5-vision-instruct", + "name": "Phi 3.5 Vision Instruct", + "display_name": "Phi 3.5 Vision Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 64000, - "output": 64000 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -8168,55 +8051,52 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-04", - "release_date": "2024-04-17", - "last_updated": "2024-04-17", + "release_date": "2024-08-16", + "last_updated": "2024-08-16", "cost": { - "input": 2, - "output": 6 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "ministral-8b-latest", - "name": "Ministral 8B", - "display_name": "Ministral 8B", + "id": "microsoft/phi-3-small-8k-instruct", + "name": "Phi 3 Small 8k Instruct", + "display_name": "Phi 3 Small 8k Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 8000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2024-10", - "release_date": "2024-10-01", - "last_updated": "2024-10-04", + "knowledge": "2023-10", + "release_date": "2024-05-07", + "last_updated": "2024-05-07", "cost": { - "input": 0.1, - "output": 0.1 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "pixtral-large-latest", - "name": "Pixtral Large", - "display_name": "Pixtral Large", + "id": "microsoft/phi-3.5-moe-instruct", + "name": "Phi 3.5 Moe Instruct", + "display_name": "Phi 3.5 Moe Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -8224,96 +8104,96 @@ }, "limit": { "context": 128000, - "output": 128000 + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2024-11", - "release_date": "2024-11-01", - "last_updated": "2024-11-04", + "release_date": "2024-08-17", + "last_updated": "2024-08-17", "cost": { - "input": 2, - "output": 6 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "mistral-small-2506", - "name": "Mistral Small 3.2", - "display_name": "Mistral Small 3.2", + "id": "microsoft/phi-4-mini-instruct", + "name": "Phi-4-Mini", + "display_name": "Phi-4-Mini", "modalities": { "input": [ "text", - "image" + "image", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-03", - "release_date": "2025-06-20", - "last_updated": "2025-06-20", + "attachment": true, + "open_weights": false, + "knowledge": "2024-12", + "release_date": "2024-12-01", + "last_updated": "2025-09-05", "cost": { - "input": 0.1, - "output": 0.3 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "devstral-2512", - "name": "Devstral 2", - "display_name": "Devstral 2", + "id": "microsoft/phi-3-medium-4k-instruct", + "name": "Phi 3 Medium 4k Instruct", + "display_name": "Phi 3 Medium 4k Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 4000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2025-12", - "release_date": "2025-12-09", - "last_updated": "2025-12-09", + "knowledge": "2023-10", + "release_date": "2024-05-07", + "last_updated": "2024-05-07", "cost": { "input": 0, "output": 0 - }, - "type": "chat" + } }, { - "id": "ministral-3b-latest", - "name": "Ministral 3B", - "display_name": "Ministral 3B", + "id": "microsoft/phi-3-vision-128k-instruct", + "name": "Phi 3 Vision 128k Instruct", + "display_name": "Phi 3 Vision 128k Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -8321,7 +8201,7 @@ }, "limit": { "context": 128000, - "output": 128000 + "output": 4096 }, "temperature": true, "tool_call": true, @@ -8330,118 +8210,112 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-10", - "release_date": "2024-10-01", - "last_updated": "2024-10-04", + "release_date": "2024-05-19", + "last_updated": "2024-05-19", "cost": { - "input": 0.04, - "output": 0.04 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "pixtral-12b", - "name": "Pixtral 12B", - "display_name": "Pixtral 12B", + "id": "openai/whisper-large-v3", + "name": "Whisper Large v3", + "display_name": "Whisper Large v3", "modalities": { "input": [ - "text", - "image" + "audio" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 0, + "output": 4096 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2024-09", - "release_date": "2024-09-01", - "last_updated": "2024-09-01", + "knowledge": "2023-09", + "release_date": "2023-09-01", + "last_updated": "2025-09-05", "cost": { - "input": 0.15, - "output": 0.15 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "mistral-medium-2505", - "name": "Mistral Medium 3", - "display_name": "Mistral Medium 3", + "id": "openai/gpt-oss-120b", + "name": "GPT-OSS-120B", + "display_name": "GPT-OSS-120B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 128000, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2025-05", - "release_date": "2025-05-07", - "last_updated": "2025-05-07", + "knowledge": "2025-08", + "release_date": "2025-08-04", + "last_updated": "2025-08-14", "cost": { - "input": 0.4, - "output": 2 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "labs-devstral-small-2512", - "name": "Devstral Small 2", - "display_name": "Devstral Small 2", + "id": "z-ai/glm4.7", + "name": "GLM-4.7", + "display_name": "GLM-4.7", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "knowledge": "2025-12", - "release_date": "2025-12-09", - "last_updated": "2025-12-09", + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "cost": { "input": 0, "output": 0 - }, - "type": "chat" + } }, { - "id": "devstral-medium-latest", - "name": "Devstral 2", - "display_name": "Devstral 2", + "id": "qwen/qwen3-next-80b-a3b-instruct", + "name": "Qwen3-Next-80B-A3B-Instruct", + "display_name": "Qwen3-Next-80B-A3B-Instruct", "modalities": { "input": [ "text" @@ -8452,7 +8326,7 @@ }, "limit": { "context": 262144, - "output": 262144 + "output": 16384 }, "temperature": true, "tool_call": true, @@ -8460,20 +8334,19 @@ "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-12", - "release_date": "2025-12-02", - "last_updated": "2025-12-02", + "open_weights": false, + "knowledge": "2024-12", + "release_date": "2024-12-01", + "last_updated": "2025-09-05", "cost": { - "input": 0.4, - "output": 2 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "devstral-small-2505", - "name": "Devstral Small 2505", - "display_name": "Devstral Small 2505", + "id": "qwen/qwen2.5-coder-32b-instruct", + "name": "Qwen2.5 Coder 32b Instruct", + "display_name": "Qwen2.5 Coder 32b Instruct", "modalities": { "input": [ "text" @@ -8484,7 +8357,7 @@ }, "limit": { "context": 128000, - "output": 128000 + "output": 4096 }, "temperature": true, "tool_call": true, @@ -8493,52 +8366,47 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-05", - "release_date": "2025-05-07", - "last_updated": "2025-05-07", + "release_date": "2024-11-06", + "last_updated": "2024-11-06", "cost": { - "input": 0.1, - "output": 0.3 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "mistral-medium-2508", - "name": "Mistral Medium 3.1", - "display_name": "Mistral Medium 3.1", + "id": "qwen/qwen2.5-coder-7b-instruct", + "name": "Qwen2.5 Coder 7b Instruct", + "display_name": "Qwen2.5 Coder 7b Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-05", - "release_date": "2025-08-12", - "last_updated": "2025-08-12", + "attachment": false, + "open_weights": true, + "release_date": "2024-09-17", + "last_updated": "2024-09-17", "cost": { - "input": 0.4, - "output": 2 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "mistral-embed", - "name": "Mistral Embed", - "display_name": "Mistral Embed", + "id": "qwen/qwen3-235b-a22b", + "name": "Qwen3-235B-A22B", + "display_name": "Qwen3-235B-A22B", "modalities": { "input": [ "text" @@ -8548,40 +8416,40 @@ ] }, "limit": { - "context": 8000, - "output": 3072 + "context": 131072, + "output": 8192 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "release_date": "2023-12-11", - "last_updated": "2023-12-11", + "knowledge": "2024-12", + "release_date": "2024-12-01", + "last_updated": "2025-09-05", "cost": { - "input": 0.1, + "input": 0, "output": 0 - }, - "type": "chat" + } }, { - "id": "mistral-small-latest", - "name": "Mistral Small", - "display_name": "Mistral Small", + "id": "qwen/qwen3-coder-480b-a35b-instruct", + "name": "Qwen3 Coder 480B A35B Instruct", + "display_name": "Qwen3 Coder 480B A35B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 262144, + "output": 66536 }, "temperature": true, "tool_call": true, @@ -8589,20 +8457,19 @@ "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-03", - "release_date": "2024-09-01", - "last_updated": "2024-09-04", + "open_weights": false, + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", "cost": { - "input": 0.1, - "output": 0.3 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "magistral-small", - "name": "Magistral Small", - "display_name": "Magistral Small", + "id": "qwen/qwq-32b", + "name": "Qwq 32b", + "display_name": "Qwq 32b", "modalities": { "input": [ "text" @@ -8613,29 +8480,27 @@ }, "limit": { "context": 128000, - "output": 128000 + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, "attachment": false, "open_weights": true, - "knowledge": "2025-06", - "release_date": "2025-03-17", - "last_updated": "2025-03-17", + "release_date": "2025-03-05", + "last_updated": "2025-03-05", "cost": { - "input": 0.5, - "output": 1.5 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "devstral-small-2507", - "name": "Devstral Small", - "display_name": "Devstral Small", + "id": "qwen/qwen3-next-80b-a3b-thinking", + "name": "Qwen3-Next-80B-A3B-Thinking", + "display_name": "Qwen3-Next-80B-A3B-Thinking", "modalities": { "input": [ "text" @@ -8645,29 +8510,29 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 262144, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "knowledge": "2025-05", - "release_date": "2025-07-10", - "last_updated": "2025-07-10", + "knowledge": "2024-12", + "release_date": "2024-12-01", + "last_updated": "2025-09-05", "cost": { - "input": 0.1, - "output": 0.3 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "codestral-latest", - "name": "Codestral", - "display_name": "Codestral", + "id": "mistralai/devstral-2-123b-instruct-2512", + "name": "Devstral-2-123B-Instruct-2512", + "display_name": "Devstral-2-123B-Instruct-2512", "modalities": { "input": [ "text" @@ -8677,93 +8542,93 @@ ] }, "limit": { - "context": 256000, - "output": 4096 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2024-10", - "release_date": "2024-05-29", - "last_updated": "2025-01-04", + "knowledge": "2025-12", + "release_date": "2025-12-08", + "last_updated": "2025-12-09", "cost": { - "input": 0.3, - "output": 0.9 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "open-mixtral-8x7b", - "name": "Mixtral 8x7B", - "display_name": "Mixtral 8x7B", + "id": "mistralai/mistral-large-3-675b-instruct-2512", + "name": "Mistral Large 3 675B Instruct 2512", + "display_name": "Mistral Large 3 675B Instruct 2512", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32000, - "output": 32000 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2024-01", - "release_date": "2023-12-11", - "last_updated": "2023-12-11", + "knowledge": "2025-01", + "release_date": "2025-12-02", + "last_updated": "2025-12-02", "cost": { - "input": 0.7, - "output": 0.7 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "mistral-nemo", - "name": "Mistral Nemo", - "display_name": "Mistral Nemo", + "id": "mistralai/ministral-14b-instruct-2512", + "name": "Ministral 3 14B Instruct 2512", + "display_name": "Ministral 3 14B Instruct 2512", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2024-07", - "release_date": "2024-07-01", - "last_updated": "2024-07-01", + "knowledge": "2025-12", + "release_date": "2025-12-01", + "last_updated": "2025-12-08", "cost": { - "input": 0.15, - "output": 0.15 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "open-mistral-7b", - "name": "Mistral 7B", - "display_name": "Mistral 7B", + "id": "mistralai/mamba-codestral-7b-v0.1", + "name": "Mamba Codestral 7b V0.1", + "display_name": "Mamba Codestral 7b V0.1", "modalities": { "input": [ "text" @@ -8773,66 +8638,60 @@ ] }, "limit": { - "context": 8000, - "output": 8000 + "context": 128000, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2023-09-27", - "last_updated": "2023-09-27", + "release_date": "2024-07-16", + "last_updated": "2024-07-16", "cost": { - "input": 0.25, - "output": 0.25 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "mistral-large-latest", - "name": "Mistral Large", - "display_name": "Mistral Large", + "id": "mistralai/mistral-large-2-instruct", + "name": "Mistral Large 2 Instruct", + "display_name": "Mistral Large 2 Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 - }, + "context": 128000, + "output": 4096 + }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2024-11", - "release_date": "2024-11-01", - "last_updated": "2025-12-02", + "release_date": "2024-07-24", + "last_updated": "2024-07-24", "cost": { - "input": 0.5, - "output": 1.5 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "mistral-medium-latest", - "name": "Mistral Medium", - "display_name": "Mistral Medium", + "id": "mistralai/codestral-22b-instruct-v0.1", + "name": "Codestral 22b Instruct V0.1", + "display_name": "Codestral 22b Instruct V0.1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -8840,7 +8699,7 @@ }, "limit": { "context": 128000, - "output": 16384 + "output": 4096 }, "temperature": true, "tool_call": true, @@ -8849,19 +8708,17 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-05", - "release_date": "2025-05-07", - "last_updated": "2025-05-10", + "release_date": "2024-05-29", + "last_updated": "2024-05-29", "cost": { - "input": 0.4, - "output": 2 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "mistral-large-2411", - "name": "Mistral Large 2.1", - "display_name": "Mistral Large 2.1", + "id": "mistralai/mistral-small-3.1-24b-instruct-2503", + "name": "Mistral Small 3.1 24b Instruct 2503", + "display_name": "Mistral Small 3.1 24b Instruct 2503", "modalities": { "input": [ "text" @@ -8871,8 +8728,8 @@ ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -8881,22 +8738,21 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-11", - "release_date": "2024-11-01", - "last_updated": "2024-11-04", + "release_date": "2025-03-11", + "last_updated": "2025-03-11", "cost": { - "input": 2, - "output": 6 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "magistral-medium-latest", - "name": "Magistral Medium", - "display_name": "Magistral Medium", + "id": "meta/llama-3.2-11b-vision-instruct", + "name": "Llama 3.2 11b Vision Instruct", + "display_name": "Llama 3.2 11b Vision Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -8904,140 +8760,122 @@ }, "limit": { "context": 128000, - "output": 16384 + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2025-06", - "release_date": "2025-03-17", - "last_updated": "2025-03-20", + "knowledge": "2023-12", + "release_date": "2024-09-18", + "last_updated": "2024-09-18", "cost": { - "input": 2, - "output": 5 - }, - "type": "chat" - } - ] - }, - "abacus": { - "id": "abacus", - "name": "Abacus", - "display_name": "Abacus", - "api": "https://routellm.abacus.ai/v1/chat/completions", - "doc": "https://abacus.ai/help/api", - "models": [ + "input": 0, + "output": 0 + } + }, { - "id": "gpt-4.1-nano", - "name": "GPT-4.1 Nano", - "display_name": "GPT-4.1 Nano", + "id": "meta/llama3-70b-instruct", + "name": "Llama3 70b Instruct", + "display_name": "Llama3 70b Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "attachment": false, + "open_weights": true, + "release_date": "2024-04-17", + "last_updated": "2024-04-17", "cost": { - "input": 0.1, - "output": 0.4 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "grok-4-fast-non-reasoning", - "name": "Grok 4 Fast (Non-Reasoning)", - "display_name": "Grok 4 Fast (Non-Reasoning)", + "id": "meta/llama-3.3-70b-instruct", + "name": "Llama 3.3 70b Instruct", + "display_name": "Llama 3.3 70b Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 16384 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-07-09", - "last_updated": "2025-07-09", + "attachment": false, + "open_weights": true, + "release_date": "2024-11-26", + "last_updated": "2024-11-26", "cost": { - "input": 0.2, - "output": 0.5 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "gemini-2.0-flash-001", - "name": "Gemini 2.0 Flash", - "display_name": "Gemini 2.0 Flash", + "id": "meta/llama-3.2-1b-instruct", + "name": "Llama 3.2 1b Instruct", + "display_name": "Llama 3.2 1b Instruct", "modalities": { "input": [ - "text", - "image", - "audio", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 8192 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-02-05", - "last_updated": "2025-02-05", + "attachment": false, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-09-18", + "last_updated": "2024-09-18", "cost": { - "input": 0.1, - "output": 0.4 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "deepseek-ai-DeepSeek-V3.2", - "name": "DeepSeek V3.2", - "display_name": "DeepSeek V3.2", + "id": "meta/llama-4-scout-17b-16e-instruct", + "name": "Llama 4 Scout 17b 16e Instruct", + "display_name": "Llama 4 Scout 17b 16e Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -9045,31 +8883,31 @@ }, "limit": { "context": 128000, - "output": 8192 + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2025-06-15", - "last_updated": "2025-06-15", + "knowledge": "2024-02", + "release_date": "2025-04-02", + "last_updated": "2025-04-02", "cost": { - "input": 0.27, - "output": 0.4 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "meta-llama-Meta-Llama-3.1-405B-Instruct-Turbo", - "name": "Llama 3.1 405B Instruct Turbo", - "display_name": "Llama 3.1 405B Instruct Turbo", + "id": "meta/llama-4-maverick-17b-128e-instruct", + "name": "Llama 4 Maverick 17b 128e Instruct", + "display_name": "Llama 4 Maverick 17b 128e Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -9084,57 +8922,50 @@ "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "knowledge": "2024-02", + "release_date": "2025-04-01", + "last_updated": "2025-04-01", "cost": { - "input": 3.5, - "output": 3.5 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "gemini-3-flash-preview", - "name": "Gemini 3 Flash Preview", - "display_name": "Gemini 3 Flash Preview", + "id": "meta/codellama-70b", + "name": "Codellama 70b", + "display_name": "Codellama 70b", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 128000, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-12-17", - "last_updated": "2025-12-17", + "attachment": false, + "open_weights": true, + "release_date": "2024-01-29", + "last_updated": "2024-01-29", "cost": { - "input": 0.5, - "output": 3 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "Qwen-Qwen3-235B-A22B-Instruct-2507", - "name": "Qwen3 235B A22B Instruct", - "display_name": "Qwen3 235B A22B Instruct", + "id": "meta/llama-3.1-405b-instruct", + "name": "Llama 3.1 405b Instruct", + "display_name": "Llama 3.1 405b Instruct", "modalities": { "input": [ "text" @@ -9144,29 +8975,27 @@ ] }, "limit": { - "context": 262144, - "output": 8192 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-07-01", - "last_updated": "2025-07-01", + "release_date": "2024-07-16", + "last_updated": "2024-07-16", "cost": { - "input": 0.13, - "output": 0.6 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "meta-llama-Meta-Llama-3.1-8B-Instruct", - "name": "Llama 3.1 8B Instruct", - "display_name": "Llama 3.1 8B Instruct", + "id": "meta/llama3-8b-instruct", + "name": "Llama3 8b Instruct", + "display_name": "Llama3 8b Instruct", "modalities": { "input": [ "text" @@ -9186,50 +9015,47 @@ }, "attachment": false, "open_weights": true, - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "release_date": "2024-04-17", + "last_updated": "2024-04-17", "cost": { - "input": 0.02, - "output": 0.05 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "grok-code-fast-1", - "name": "Grok Code Fast 1", - "display_name": "Grok Code Fast 1", + "id": "meta/llama-3.1-70b-instruct", + "name": "Llama 3.1 70b Instruct", + "display_name": "Llama 3.1 70b Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 16384 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-09-01", - "last_updated": "2025-09-01", + "attachment": false, + "open_weights": true, + "release_date": "2024-07-16", + "last_updated": "2024-07-16", "cost": { - "input": 0.2, - "output": 1.5 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "deepseek-ai-DeepSeek-R1", - "name": "DeepSeek R1", - "display_name": "DeepSeek R1", + "id": "deepseek-ai/deepseek-r1-0528", + "name": "Deepseek R1 0528", + "display_name": "Deepseek R1 0528", "modalities": { "input": [ "text" @@ -9240,7 +9066,7 @@ }, "limit": { "context": 128000, - "output": 8192 + "output": 4096 }, "temperature": true, "tool_call": true, @@ -9250,18 +9076,17 @@ }, "attachment": false, "open_weights": true, - "release_date": "2025-01-20", - "last_updated": "2025-01-20", + "release_date": "2025-05-28", + "last_updated": "2025-05-28", "cost": { - "input": 3, - "output": 7 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "kimi-k2-turbo-preview", - "name": "Kimi K2 Turbo Preview", - "display_name": "Kimi K2 Turbo Preview", + "id": "deepseek-ai/deepseek-r1", + "name": "Deepseek R1", + "display_name": "Deepseek R1", "modalities": { "input": [ "text" @@ -9271,42 +9096,39 @@ ] }, "limit": { - "context": 256000, - "output": 8192 + "context": 128000, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2025-07-08", - "last_updated": "2025-07-08", + "open_weights": true, + "release_date": "2025-01-20", + "last_updated": "2025-01-20", "cost": { - "input": 0.15, - "output": 8 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "gemini-3-pro-preview", - "name": "Gemini 3 Pro Preview", - "display_name": "Gemini 3 Pro Preview", + "id": "deepseek-ai/deepseek-v3.1-terminus", + "name": "DeepSeek V3.1 Terminus", + "display_name": "DeepSeek V3.1 Terminus", "modalities": { "input": [ - "text", - "image", - "audio", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 65000 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -9314,20 +9136,20 @@ "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-06-01", - "last_updated": "2025-06-01", + "knowledge": "2025-01", + "release_date": "2025-09-22", + "last_updated": "2025-09-22", "cost": { - "input": 2, - "output": 12 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "qwen-qwen3-coder-480b-a35b-instruct", - "name": "Qwen3 Coder 480B A35B Instruct", - "display_name": "Qwen3 Coder 480B A35B Instruct", + "id": "deepseek-ai/deepseek-v3.1", + "name": "DeepSeek V3.1", + "display_name": "DeepSeek V3.1", "modalities": { "input": [ "text" @@ -9337,8 +9159,8 @@ ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -9347,33 +9169,29 @@ "default": true }, "attachment": false, - "open_weights": true, - "release_date": "2025-07-22", - "last_updated": "2025-07-22", + "open_weights": false, + "knowledge": "2024-07", + "release_date": "2025-08-20", + "last_updated": "2025-08-26", "cost": { - "input": 0.29, - "output": 1.2 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "gemini-2.5-flash", - "name": "Gemini 2.5 Flash", - "display_name": "Gemini 2.5 Flash", + "id": "deepseek-ai/deepseek-v3.2", + "name": "DeepSeek V3.2", + "display_name": "DeepSeek V3.2", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, + "context": 163840, "output": 65536 }, "temperature": true, @@ -9382,89 +9200,89 @@ "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-03-20", - "last_updated": "2025-06-05", + "knowledge": "2024-07", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "cost": { - "input": 0.3, - "output": 2.5 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "gpt-4.1-mini", - "name": "GPT-4.1 Mini", - "display_name": "GPT-4.1 Mini", + "id": "deepseek-ai/deepseek-coder-6.7b-instruct", + "name": "Deepseek Coder 6.7b Instruct", + "display_name": "Deepseek Coder 6.7b Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "attachment": false, + "open_weights": true, + "release_date": "2023-10-29", + "last_updated": "2023-10-29", "cost": { - "input": 0.4, - "output": 1.6 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "claude-opus-4-5-20251101", - "name": "Claude Opus 4.5", - "display_name": "Claude Opus 4.5", + "id": "black-forest-labs/flux.1-dev", + "name": "FLUX.1-dev", + "display_name": "FLUX.1-dev", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 200000, - "output": 64000 - }, + "context": 4096, + "output": 0 + }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-11-01", - "last_updated": "2025-11-01", + "knowledge": "2024-08", + "release_date": "2024-08-01", + "last_updated": "2025-09-05", "cost": { - "input": 5, - "output": 25 - }, - "type": "chat" - }, + "input": 0, + "output": 0 + } + } + ] + }, + "cohere": { + "id": "cohere", + "name": "Cohere", + "display_name": "Cohere", + "doc": "https://docs.cohere.com/docs/models", + "models": [ { - "id": "qwen-2.5-coder-32b", - "name": "Qwen 2.5 Coder 32B", - "display_name": "Qwen 2.5 Coder 32B", + "id": "command-a-translate-08-2025", + "name": "Command A Translate", + "display_name": "Command A Translate", "modalities": { "input": [ "text" @@ -9474,8 +9292,8 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 8000, + "output": 8000 }, "temperature": true, "tool_call": true, @@ -9484,31 +9302,29 @@ }, "attachment": false, "open_weights": true, - "release_date": "2024-11-11", - "last_updated": "2024-11-11", + "knowledge": "2024-06-01", + "release_date": "2025-08-28", + "last_updated": "2025-08-28", "cost": { - "input": 0.79, - "output": 0.79 - }, - "type": "chat" + "input": 2.5, + "output": 10 + } }, { - "id": "claude-sonnet-4-5-20250929", - "name": "Claude Sonnet 4.5", - "display_name": "Claude Sonnet 4.5", + "id": "command-a-03-2025", + "name": "Command A", + "display_name": "Command A", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 256000, + "output": 8000 }, "temperature": true, "tool_call": true, @@ -9516,25 +9332,23 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "attachment": false, + "open_weights": true, + "knowledge": "2024-06-01", + "release_date": "2025-03-13", + "last_updated": "2025-03-13", "cost": { - "input": 3, - "output": 15 - }, - "type": "chat" + "input": 2.5, + "output": 10 + } }, { - "id": "openai-gpt-oss-120b", - "name": "GPT-OSS 120B", - "display_name": "GPT-OSS 120B", + "id": "command-r-08-2024", + "name": "Command R", + "display_name": "Command R", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -9542,7 +9356,7 @@ }, "limit": { "context": 128000, - "output": 32768 + "output": 4000 }, "temperature": true, "tool_call": true, @@ -9550,20 +9364,20 @@ "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "knowledge": "2024-06-01", + "release_date": "2024-08-30", + "last_updated": "2024-08-30", "cost": { - "input": 0.08, - "output": 0.44 - }, - "type": "chat" + "input": 0.15, + "output": 0.6 + } }, { - "id": "qwen-qwen3-Max", - "name": "Qwen3 Max", - "display_name": "Qwen3 Max", + "id": "command-r-plus-08-2024", + "name": "Command R+", + "display_name": "Command R+", "modalities": { "input": [ "text" @@ -9573,8 +9387,8 @@ ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 128000, + "output": 4000 }, "temperature": true, "tool_call": true, @@ -9583,52 +9397,50 @@ "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2025-05-28", - "last_updated": "2025-05-28", + "open_weights": true, + "knowledge": "2024-06-01", + "release_date": "2024-08-30", + "last_updated": "2024-08-30", "cost": { - "input": 1.2, - "output": 6 - }, - "type": "chat" + "input": 2.5, + "output": 10 + } }, { - "id": "grok-4-0709", - "name": "Grok 4", - "display_name": "Grok 4", + "id": "command-r7b-12-2024", + "name": "Command R7B", + "display_name": "Command R7B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 16384 + "context": 128000, + "output": 4000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-07-09", - "last_updated": "2025-07-09", + "attachment": false, + "open_weights": true, + "knowledge": "2024-06-01", + "release_date": "2024-02-27", + "last_updated": "2024-02-27", "cost": { - "input": 3, - "output": 15 - }, - "type": "chat" + "input": 0.0375, + "output": 0.15 + } }, { - "id": "meta-llama-Meta-Llama-3.1-70B-Instruct", - "name": "Llama 3.1 70B Instruct", - "display_name": "Llama 3.1 70B Instruct", + "id": "command-a-reasoning-08-2025", + "name": "Command A Reasoning", + "display_name": "Command A Reasoning", "modalities": { "input": [ "text" @@ -9638,61 +9450,70 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 256000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "knowledge": "2024-06-01", + "release_date": "2025-08-21", + "last_updated": "2025-08-21", "cost": { - "input": 0.4, - "output": 0.4 - }, - "type": "chat" + "input": 2.5, + "output": 10 + } }, { - "id": "o3-mini", - "name": "o3-mini", - "display_name": "o3-mini", + "id": "command-a-vision-07-2025", + "name": "Command A Vision", + "display_name": "Command A Vision", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 128000, + "output": 8000 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-05", - "release_date": "2024-12-20", - "last_updated": "2025-01-29", + "open_weights": true, + "knowledge": "2024-06-01", + "release_date": "2025-07-31", + "last_updated": "2025-07-31", "cost": { - "input": 1.1, - "output": 4.4 - }, - "type": "chat" - }, + "input": 2.5, + "output": 10 + } + } + ] + }, + "upstage": { + "id": "upstage", + "name": "Upstage", + "display_name": "Upstage", + "api": "https://api.upstage.ai/v1/solar", + "doc": "https://developers.upstage.ai/docs/apis/chat", + "models": [ { - "id": "zai-org-glm-4.5", - "name": "GLM-4.5", - "display_name": "GLM-4.5", + "id": "solar-mini", + "name": "solar-mini", + "display_name": "solar-mini", "modalities": { "input": [ "text" @@ -9702,228 +9523,225 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 32768, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "open_weights": false, + "knowledge": "2024-09", + "release_date": "2024-06-12", + "last_updated": "2025-04-22", "cost": { - "input": 0.6, - "output": 2.2 - }, - "type": "chat" + "input": 0.15, + "output": 0.15 + } }, { - "id": "gemini-2.0-pro-exp-02-05", - "name": "Gemini 2.0 Pro Exp", - "display_name": "Gemini 2.0 Pro Exp", + "id": "solar-pro3", + "name": "solar-pro3", + "display_name": "solar-pro3", "modalities": { "input": [ - "text", - "image", - "audio", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 2000000, + "context": 131072, "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-02-05", - "last_updated": "2025-02-05", - "type": "chat" + "knowledge": "2025-03", + "release_date": "2026-01", + "last_updated": "2026-01", + "cost": { + "input": 0.25, + "output": 0.25 + } }, { - "id": "gpt-5.1", - "name": "GPT-5.1", - "display_name": "GPT-5.1", + "id": "solar-pro2", + "name": "solar-pro2", + "display_name": "solar-pro2", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 65536, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "knowledge": "2025-03", + "release_date": "2025-05-20", + "last_updated": "2025-05-20", "cost": { - "input": 1.25, - "output": 10 - }, - "type": "chat" - }, + "input": 0.25, + "output": 0.25 + } + } + ] + }, + "groq": { + "id": "groq", + "name": "Groq", + "display_name": "Groq", + "doc": "https://console.groq.com/docs/models", + "models": [ { - "id": "gpt-5-nano", - "name": "GPT-5 Nano", - "display_name": "GPT-5 Nano", + "id": "llama-3.1-8b-instant", + "name": "Llama 3.1 8B Instant", + "display_name": "Llama 3.1 8B Instant", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 131072, + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "attachment": false, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { "input": 0.05, - "output": 0.4 - }, - "type": "chat" + "output": 0.08 + } }, { - "id": "claude-sonnet-4-20250514", - "name": "Claude Sonnet 4", - "display_name": "Claude Sonnet 4", + "id": "mistral-saba-24b", + "name": "Mistral Saba 24B", + "display_name": "Mistral Saba 24B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 32768, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-05-14", - "last_updated": "2025-05-14", + "knowledge": "2024-08", + "release_date": "2025-02-06", + "last_updated": "2025-02-06", "cost": { - "input": 3, - "output": 15 - }, - "type": "chat" + "input": 0.79, + "output": 0.79 + } }, { - "id": "gpt-4.1", - "name": "GPT-4.1", - "display_name": "GPT-4.1", + "id": "llama3-8b-8192", + "name": "Llama 3 8B", + "display_name": "Llama 3 8B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 8192, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "attachment": false, + "open_weights": true, + "knowledge": "2023-03", + "release_date": "2024-04-18", + "last_updated": "2024-04-18", "cost": { - "input": 2, - "output": 8 - }, - "type": "chat" + "input": 0.05, + "output": 0.08 + } }, { - "id": "o4-mini", - "name": "o4-mini", - "display_name": "o4-mini", + "id": "qwen-qwq-32b", + "name": "Qwen QwQ 32B", + "display_name": "Qwen QwQ 32B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 131072, + "output": 16384 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-05", - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "attachment": false, + "open_weights": true, + "knowledge": "2024-09", + "release_date": "2024-11-27", + "last_updated": "2024-11-27", "cost": { - "input": 1.1, - "output": 4.4 - }, - "type": "chat" + "input": 0.29, + "output": 0.39 + } }, { - "id": "Qwen-Qwen3-32B", - "name": "Qwen3 32B", - "display_name": "Qwen3 32B", + "id": "llama3-70b-8192", + "name": "Llama 3 70B", + "display_name": "Llama 3 70B", "modalities": { "input": [ "text" @@ -9933,42 +9751,39 @@ ] }, "limit": { - "context": 128000, + "context": 8192, "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-04-29", - "last_updated": "2025-04-29", + "knowledge": "2023-03", + "release_date": "2024-04-18", + "last_updated": "2024-04-18", "cost": { - "input": 0.09, - "output": 0.29 - }, - "type": "chat" + "input": 0.59, + "output": 0.79 + } }, { - "id": "claude-opus-4-20250514", - "name": "Claude Opus 4", - "display_name": "Claude Opus 4", + "id": "deepseek-r1-distill-llama-70b", + "name": "DeepSeek R1 Distill Llama 70B", + "display_name": "DeepSeek R1 Distill Llama 70B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -9976,156 +9791,143 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-05-14", - "last_updated": "2025-05-14", + "attachment": false, + "open_weights": true, + "knowledge": "2024-07", + "release_date": "2025-01-20", + "last_updated": "2025-01-20", "cost": { - "input": 15, - "output": 75 - }, - "type": "chat" + "input": 0.75, + "output": 0.99 + } }, { - "id": "gpt-5-mini", - "name": "GPT-5 Mini", - "display_name": "GPT-5 Mini", + "id": "llama-guard-3-8b", + "name": "Llama Guard 3 8B", + "display_name": "Llama Guard 3 8B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 8192, + "output": 8192 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "attachment": false, + "open_weights": true, + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 0.25, - "output": 2 - }, - "type": "chat" + "input": 0.2, + "output": 0.2 + } }, { - "id": "meta-llama-Llama-4-Maverick-17B-128E-Instruct-FP8", - "name": "Llama 4 Maverick 17B 128E Instruct FP8", - "display_name": "Llama 4 Maverick 17B 128E Instruct FP8", + "id": "gemma2-9b-it", + "name": "Gemma 2 9B", + "display_name": "Gemma 2 9B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 32768 + "context": 8192, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "knowledge": "2024-06", + "release_date": "2024-06-27", + "last_updated": "2024-06-27", "cost": { - "input": 0.14, - "output": 0.59 - }, - "type": "chat" + "input": 0.2, + "output": 0.2 + } }, { - "id": "o3-pro", - "name": "o3-pro", - "display_name": "o3-pro", + "id": "llama-3.3-70b-versatile", + "name": "Llama 3.3 70B Versatile", + "display_name": "Llama 3.3 70B Versatile", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 131072, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-05", - "release_date": "2025-06-10", - "last_updated": "2025-06-10", + "attachment": false, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 20, - "output": 80 - }, - "type": "chat" + "input": 0.59, + "output": 0.79 + } }, { - "id": "claude-3-7-sonnet-20250219", - "name": "Claude Sonnet 3.7", - "display_name": "Claude Sonnet 3.7", + "id": "moonshotai/kimi-k2-instruct-0905", + "name": "Kimi K2 Instruct 0905", + "display_name": "Kimi K2 Instruct 0905", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 262144, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-10-31", - "release_date": "2025-02-19", - "last_updated": "2025-02-19", + "attachment": false, + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", "cost": { - "input": 3, - "output": 15 - }, - "type": "chat" + "input": 1, + "output": 3 + } }, { - "id": "deepseek-ai-DeepSeek-V3.1-Terminus", - "name": "DeepSeek V3.1 Terminus", - "display_name": "DeepSeek V3.1 Terminus", + "id": "moonshotai/kimi-k2-instruct", + "name": "Kimi K2 Instruct", + "display_name": "Kimi K2 Instruct", "modalities": { "input": [ "text" @@ -10135,43 +9937,38 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 131072, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-06-01", - "last_updated": "2025-06-01", + "knowledge": "2024-10", + "release_date": "2025-07-14", + "last_updated": "2025-07-14", "cost": { - "input": 0.27, - "output": 1 - }, - "type": "chat" + "input": 1, + "output": 3 + } }, { - "id": "gemini-2.5-pro", - "name": "Gemini 2.5 Pro", - "display_name": "Gemini 2.5 Pro", + "id": "openai/gpt-oss-20b", + "name": "GPT OSS 20B", + "display_name": "GPT OSS 20B", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, + "context": 131072, "output": 65536 }, "temperature": true, @@ -10180,99 +9977,93 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-03-25", - "last_updated": "2025-03-25", + "attachment": false, + "open_weights": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 1.25, - "output": 10 - }, - "type": "chat" + "input": 0.075, + "output": 0.3 + } }, { - "id": "gpt-4o-2024-11-20", - "name": "GPT-4o (2024-11-20)", - "display_name": "GPT-4o (2024-11-20)", + "id": "openai/gpt-oss-120b", + "name": "GPT OSS 120B", + "display_name": "GPT OSS 120B", "modalities": { "input": [ - "text", - "image", - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 131072, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-11-20", - "last_updated": "2024-11-20", + "attachment": false, + "open_weights": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 2.5, - "output": 10 - }, - "type": "chat" + "input": 0.15, + "output": 0.6 + } }, { - "id": "o3", - "name": "o3", - "display_name": "o3", + "id": "qwen/qwen3-32b", + "name": "Qwen3 32B", + "display_name": "Qwen3 32B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 131072, + "output": 16384 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-05", - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "attachment": false, + "open_weights": true, + "knowledge": "2024-11-08", + "release_date": "2024-12-23", + "last_updated": "2024-12-23", "cost": { - "input": 2, - "output": 8 - }, - "type": "chat" + "input": 0.29, + "output": 0.59 + } }, { - "id": "Qwen-Qwen2.5-72B-Instruct", - "name": "Qwen 2.5 72B Instruct", - "display_name": "Qwen 2.5 72B Instruct", + "id": "meta-llama/llama-4-scout-17b-16e-instruct", + "name": "Llama 4 Scout 17B", + "display_name": "Llama 4 Scout 17B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 131072, "output": 8192 }, "temperature": true, @@ -10282,28 +10073,29 @@ }, "attachment": false, "open_weights": true, - "release_date": "2024-09-19", - "last_updated": "2024-09-19", + "knowledge": "2024-08", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", "cost": { "input": 0.11, - "output": 0.38 - }, - "type": "chat" + "output": 0.34 + } }, { - "id": "zai-org-glm-4.6", - "name": "GLM-4.6", - "display_name": "GLM-4.6", + "id": "meta-llama/llama-4-maverick-17b-128e-instruct", + "name": "Llama 4 Maverick 17B", + "display_name": "Llama 4 Maverick 17B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 131072, "output": 8192 }, "temperature": true, @@ -10313,50 +10105,58 @@ }, "attachment": false, "open_weights": true, - "release_date": "2025-03-01", - "last_updated": "2025-03-01", + "knowledge": "2024-08", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", "cost": { - "input": 0.6, - "output": 2.2 - }, - "type": "chat" + "input": 0.2, + "output": 0.6 + } }, { - "id": "deepseek-deepseek-v3.1", - "name": "DeepSeek V3.1", - "display_name": "DeepSeek V3.1", + "id": "meta-llama/llama-guard-4-12b", + "name": "Llama Guard 4 12B", + "display_name": "Llama Guard 4 12B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 131072, + "output": 1024 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-08-01", - "last_updated": "2025-08-01", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", "cost": { - "input": 0.55, - "output": 1.66 - }, - "type": "chat" - }, + "input": 0.2, + "output": 0.2 + } + } + ] + }, + "bailing": { + "id": "bailing", + "name": "Bailing", + "display_name": "Bailing", + "api": "https://api.tbox.cn/api/llm/v1/chat/completions", + "doc": "https://alipaytbox.yuque.com/sxs0ba/ling/intro", + "models": [ { - "id": "Qwen-QwQ-32B", - "name": "QwQ 32B", - "display_name": "QwQ 32B", + "id": "Ling-1T", + "name": "Ling-1T", + "display_name": "Ling-1T", "modalities": { "input": [ "text" @@ -10366,33 +10166,31 @@ ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 128000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2024-11-28", - "last_updated": "2024-11-28", + "knowledge": "2024-06", + "release_date": "2025-10", + "last_updated": "2025-10", "cost": { - "input": 0.4, - "output": 0.4 - }, - "type": "chat" + "input": 0.57, + "output": 2.29 + } }, { - "id": "gpt-4o-mini", - "name": "GPT-4o Mini", - "display_name": "GPT-4o Mini", + "id": "Ring-1T", + "name": "Ring-1T", + "display_name": "Ring-1T", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -10400,42 +10198,53 @@ }, "limit": { "context": 128000, - "output": 16384 + "output": 32000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-07-18", - "last_updated": "2024-07-18", + "attachment": false, + "open_weights": true, + "knowledge": "2024-06", + "release_date": "2025-10", + "last_updated": "2025-10", "cost": { - "input": 0.15, - "output": 0.6 - }, - "type": "chat" - }, + "input": 0.57, + "output": 2.29 + } + } + ] + }, + "github-copilot": { + "id": "github-copilot", + "name": "GitHub Copilot", + "display_name": "GitHub Copilot", + "api": "https://api.githubcopilot.com", + "doc": "https://docs.github.com/en/copilot", + "models": [ { - "id": "gpt-5", - "name": "GPT-5", - "display_name": "GPT-5", + "id": "gemini-3-flash-preview", + "name": "Gemini 3 Flash", + "display_name": "Gemini 3 Flash", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 128000, + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -10443,19 +10252,18 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "knowledge": "2025-01", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", "cost": { - "input": 1.25, - "output": 10 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "grok-4-1-fast-non-reasoning", - "name": "Grok 4.1 Fast (Non-Reasoning)", - "display_name": "Grok 4.1 Fast (Non-Reasoning)", + "id": "gpt-5.2-codex", + "name": "GPT-5.2-Codex", + "display_name": "GPT-5.2-Codex", "modalities": { "input": [ "text", @@ -10466,28 +10274,29 @@ ] }, "limit": { - "context": 2000000, - "output": 16384 + "context": 272000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-11-17", - "last_updated": "2025-11-17", + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 0.2, - "output": 0.5 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "llama-3.3-70b-versatile", - "name": "Llama 3.3 70B Versatile", - "display_name": "Llama 3.3 70B Versatile", + "id": "grok-code-fast-1", + "name": "Grok Code Fast 1", + "display_name": "Grok Code Fast 1", "modalities": { "input": [ "text" @@ -10498,61 +10307,61 @@ }, "limit": { "context": 128000, - "output": 32768 + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": true, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "open_weights": false, + "knowledge": "2025-08", + "release_date": "2025-08-27", + "last_updated": "2025-08-27", "cost": { - "input": 0.59, - "output": 0.79 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "claude-opus-4-1-20250805", - "name": "Claude Opus 4.1", - "display_name": "Claude Opus 4.1", + "id": "gpt-5.1-codex", + "name": "GPT-5.1-Codex", + "display_name": "GPT-5.1-Codex", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 128000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 15, - "output": 75 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "gpt-5.2", - "name": "GPT-5.2", - "display_name": "GPT-5.2", + "id": "claude-haiku-4.5", + "name": "Claude Haiku 4.5", + "display_name": "Claude Haiku 4.5", "modalities": { "input": [ "text", @@ -10563,10 +10372,10 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 128000, + "output": 16000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -10574,19 +10383,53 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "cost": { - "input": 1.75, - "output": 14 + "input": 0, + "output": 0 + } + }, + { + "id": "gemini-3-pro-preview", + "name": "Gemini 3 Pro Preview", + "display_name": "Gemini 3 Pro Preview", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video" + ], + "output": [ + "text" + ] }, - "type": "chat" + "limit": { + "context": 128000, + "output": 64000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", + "cost": { + "input": 0, + "output": 0 + } }, { - "id": "gpt-5.1-chat-latest", - "name": "GPT-5.1 Chat Latest", - "display_name": "GPT-5.1 Chat Latest", + "id": "gpt-5.1-codex-mini", + "name": "GPT-5.1-Codex-mini", + "display_name": "GPT-5.1-Codex-mini", "modalities": { "input": [ "text", @@ -10597,8 +10440,8 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 128000, + "output": 100000 }, "temperature": false, "tool_call": true, @@ -10606,36 +10449,34 @@ "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, "knowledge": "2024-09-30", "release_date": "2025-11-13", "last_updated": "2025-11-13", "cost": { - "input": 1.25, - "output": 10 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "claude-haiku-4-5-20251001", - "name": "Claude Haiku 4.5", - "display_name": "Claude Haiku 4.5", + "id": "gpt-5.1", + "name": "GPT-5.1", + "display_name": "GPT-5.1", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 128000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -10643,37 +10484,29 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-02-28", - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 1, - "output": 5 - }, - "type": "chat" - } - ] - }, - "vercel": { - "id": "vercel", - "name": "Vercel AI Gateway", - "display_name": "Vercel AI Gateway", - "doc": "https://github.com/vercel/ai/tree/5eb85cc45a259553501f535b8ac79a77d0e79223/packages/gateway", - "models": [ + "input": 0, + "output": 0 + } + }, { - "id": "moonshotai/kimi-k2", - "name": "Kimi K2 Instruct", - "display_name": "Kimi K2 Instruct", + "id": "gpt-4o", + "name": "GPT-4o", + "display_name": "GPT-4o", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, + "context": 64000, "output": 16384 }, "temperature": true, @@ -10681,53 +10514,52 @@ "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-07-14", - "last_updated": "2025-07-14", + "attachment": true, + "open_weights": false, + "knowledge": "2023-09", + "release_date": "2024-05-13", + "last_updated": "2024-05-13", "cost": { - "input": 1, - "output": 3 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "alibaba/qwen3-next-80b-a3b-instruct", - "name": "Qwen3 Next 80B A3B Instruct", - "display_name": "Qwen3 Next 80B A3B Instruct", + "id": "gpt-4.1", + "name": "GPT-4.1", + "display_name": "GPT-4.1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-09-12", - "last_updated": "2025-09-12", + "attachment": true, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.5, - "output": 2 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "alibaba/qwen3-vl-instruct", - "name": "Qwen3 VL Instruct", - "display_name": "Qwen3 VL Instruct", + "id": "claude-opus-41", + "name": "Claude Opus 4.1", + "display_name": "Claude Opus 4.1", "modalities": { "input": [ "text", @@ -10738,29 +10570,29 @@ ] }, "limit": { - "context": 131072, - "output": 129024 + "context": 80000, + "output": 16000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-09-24", - "last_updated": "2025-09-24", + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.7, - "output": 2.8 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "alibaba/qwen3-vl-thinking", - "name": "Qwen3 VL Thinking", - "display_name": "Qwen3 VL Thinking", + "id": "gpt-5-mini", + "name": "GPT-5-mini", + "display_name": "GPT-5-mini", "modalities": { "input": [ "text", @@ -10771,8 +10603,8 @@ ] }, "limit": { - "context": 131072, - "output": 129024 + "context": 128000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -10781,95 +10613,98 @@ "default": true }, "attachment": true, - "open_weights": true, - "knowledge": "2025-09", - "release_date": "2025-09-24", - "last_updated": "2025-09-24", + "open_weights": false, + "knowledge": "2024-06", + "release_date": "2025-08-13", + "last_updated": "2025-08-13", "cost": { - "input": 0.7, - "output": 8.4 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "alibaba/qwen3-max", - "name": "Qwen3 Max", - "display_name": "Qwen3 Max", + "id": "gemini-2.5-pro", + "name": "Gemini 2.5 Pro", + "display_name": "Gemini 2.5 Pro", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 128000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-09-23", - "last_updated": "2025-09-23", + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-06-05", "cost": { - "input": 1.2, - "output": 6 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "alibaba/qwen3-coder-plus", - "name": "Qwen3 Coder Plus", - "display_name": "Qwen3 Coder Plus", + "id": "gpt-5.1-codex-max", + "name": "GPT-5.1-Codex-max", + "display_name": "GPT-5.1-Codex-max", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 1000000 + "context": 128000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-23", - "last_updated": "2025-07-23", + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-12-04", + "last_updated": "2025-12-04", "cost": { - "input": 1, - "output": 5 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "alibaba/qwen3-next-80b-a3b-thinking", - "name": "Qwen3 Next 80B A3B Thinking", - "display_name": "Qwen3 Next 80B A3B Thinking", + "id": "claude-sonnet-4", + "name": "Claude Sonnet 4", + "display_name": "Claude Sonnet 4", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 128000, + "output": 16000 }, "temperature": true, "tool_call": true, @@ -10877,32 +10712,32 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-09", - "release_date": "2025-09-12", - "last_updated": "2025-09-12", + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 0.5, - "output": 6 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "xai/grok-3-mini-fast", - "name": "Grok 3 Mini Fast", - "display_name": "Grok 3 Mini Fast", + "id": "gpt-5", + "name": "GPT-5", + "display_name": "GPT-5", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -10910,34 +10745,32 @@ "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-11", - "release_date": "2025-02-17", - "last_updated": "2025-02-17", + "knowledge": "2024-10", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.6, - "output": 4, - "reasoning": 4, - "cache_read": 0.15 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "xai/grok-3-mini", - "name": "Grok 3 Mini", - "display_name": "Grok 3 Mini", + "id": "claude-opus-4.5", + "name": "Claude Opus 4.5", + "display_name": "Claude Opus 4.5", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 16000 }, "temperature": true, "tool_call": true, @@ -10945,23 +10778,20 @@ "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-11", - "release_date": "2025-02-17", - "last_updated": "2025-02-17", + "knowledge": "2025-03-31", + "release_date": "2025-11-24", + "last_updated": "2025-08-01", "cost": { - "input": 0.3, - "output": 0.5, - "reasoning": 0.5, - "cache_read": 0.075 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "xai/grok-4-fast", - "name": "Grok 4 Fast", - "display_name": "Grok 4 Fast", + "id": "gpt-5.2", + "name": "GPT-5.2", + "display_name": "GPT-5.2", "modalities": { "input": [ "text", @@ -10972,10 +10802,10 @@ ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 128000, + "output": 64000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -10983,86 +10813,92 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-09-19", - "last_updated": "2025-09-19", + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "xai/grok-3", - "name": "Grok 3", - "display_name": "Grok 3", + "id": "claude-sonnet-4.5", + "name": "Claude Sonnet 4.5", + "display_name": "Claude Sonnet 4.5", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 16000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-11", - "release_date": "2025-02-17", - "last_updated": "2025-02-17", + "knowledge": "2025-03-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.75 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "xai/grok-2", - "name": "Grok 2", - "display_name": "Grok 2", + "id": "claude-opus-4.6", + "name": "Claude Opus 4.6", + "display_name": "Claude Opus 4.6", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-08", - "release_date": "2024-08-20", - "last_updated": "2024-08-20", + "knowledge": "2025-03-31", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", "cost": { - "input": 2, - "output": 10, - "cache_read": 2 - }, - "type": "chat" - }, + "input": 0, + "output": 0 + } + } + ] + }, + "mistral": { + "id": "mistral", + "name": "Mistral", + "display_name": "Mistral", + "doc": "https://docs.mistral.ai/getting-started/models/", + "models": [ { - "id": "xai/grok-code-fast-1", - "name": "Grok Code Fast 1", - "display_name": "Grok Code Fast 1", + "id": "devstral-medium-2507", + "name": "Devstral Medium", + "display_name": "Devstral Medium", "modalities": { "input": [ "text" @@ -11072,31 +10908,28 @@ ] }, "limit": { - "context": 256000, - "output": 10000 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2023-10", - "release_date": "2025-08-28", - "last_updated": "2025-08-28", + "open_weights": true, + "knowledge": "2025-05", + "release_date": "2025-07-10", + "last_updated": "2025-07-10", "cost": { - "input": 0.2, - "output": 1.5, - "cache_read": 0.02 - }, - "type": "chat" + "input": 0.4, + "output": 2 + } }, { - "id": "xai/grok-2-vision", - "name": "Grok 2 Vision", - "display_name": "Grok 2 Vision", + "id": "mistral-large-2512", + "name": "Mistral Large 3", + "display_name": "Mistral Large 3", "modalities": { "input": [ "text", @@ -11107,8 +10940,8 @@ ] }, "limit": { - "context": 8192, - "output": 4096 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -11116,21 +10949,19 @@ "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2024-08", - "release_date": "2024-08-20", - "last_updated": "2024-08-20", + "open_weights": true, + "knowledge": "2024-11", + "release_date": "2024-11-01", + "last_updated": "2025-12-02", "cost": { - "input": 2, - "output": 10, - "cache_read": 2 - }, - "type": "chat" + "input": 0.5, + "output": 1.5 + } }, { - "id": "xai/grok-4", - "name": "Grok 4", - "display_name": "Grok 4", + "id": "open-mixtral-8x22b", + "name": "Mixtral 8x22B", + "display_name": "Mixtral 8x22B", "modalities": { "input": [ "text" @@ -11140,32 +10971,28 @@ ] }, "limit": { - "context": 256000, + "context": 64000, "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-07-09", - "last_updated": "2025-07-09", + "open_weights": true, + "knowledge": "2024-04", + "release_date": "2024-04-17", + "last_updated": "2024-04-17", "cost": { - "input": 3, - "output": 15, - "reasoning": 15, - "cache_read": 0.75 - }, - "type": "chat" + "input": 2, + "output": 6 + } }, { - "id": "xai/grok-3-fast", - "name": "Grok 3 Fast", - "display_name": "Grok 3 Fast", + "id": "ministral-8b-latest", + "name": "Ministral 8B", + "display_name": "Ministral 8B", "modalities": { "input": [ "text" @@ -11175,8 +11002,8 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -11184,21 +11011,19 @@ "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-11", - "release_date": "2025-02-17", - "last_updated": "2025-02-17", + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2024-10-01", + "last_updated": "2024-10-04", "cost": { - "input": 5, - "output": 25, - "cache_read": 1.25 - }, - "type": "chat" + "input": 0.1, + "output": 0.1 + } }, { - "id": "xai/grok-4-fast-non-reasoning", - "name": "Grok 4 Fast (Non-Reasoning)", - "display_name": "Grok 4 Fast (Non-Reasoning)", + "id": "pixtral-large-latest", + "name": "Pixtral Large", + "display_name": "Pixtral Large", "modalities": { "input": [ "text", @@ -11209,8 +11034,8 @@ ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -11218,32 +11043,31 @@ "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-09-19", - "last_updated": "2025-09-19", + "open_weights": true, + "knowledge": "2024-11", + "release_date": "2024-11-01", + "last_updated": "2024-11-04", "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 - }, - "type": "chat" + "input": 2, + "output": 6 + } }, { - "id": "mistral/codestral", - "name": "Codestral", - "display_name": "Codestral", + "id": "mistral-small-2506", + "name": "Mistral Small 3.2", + "display_name": "Mistral Small 3.2", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 4096 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -11252,19 +11076,18 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-10", - "release_date": "2024-05-29", - "last_updated": "2025-01-04", + "knowledge": "2025-03", + "release_date": "2025-06-20", + "last_updated": "2025-06-20", "cost": { - "input": 0.3, - "output": 0.9 - }, - "type": "chat" + "input": 0.1, + "output": 0.3 + } }, { - "id": "mistral/magistral-medium", - "name": "Magistral Medium", - "display_name": "Magistral Medium", + "id": "devstral-2512", + "name": "Devstral 2", + "display_name": "Devstral 2", "modalities": { "input": [ "text" @@ -11274,63 +11097,59 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-06", - "release_date": "2025-03-17", - "last_updated": "2025-03-20", + "knowledge": "2025-12", + "release_date": "2025-12-09", + "last_updated": "2025-12-09", "cost": { - "input": 2, - "output": 5 - }, - "type": "chat" + "input": 0.4, + "output": 2 + } }, { - "id": "mistral/mistral-large", - "name": "Mistral Large", - "display_name": "Mistral Large", + "id": "ministral-3b-latest", + "name": "Ministral 3B", + "display_name": "Ministral 3B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2024-11", - "release_date": "2024-11-01", - "last_updated": "2025-12-02", + "knowledge": "2024-10", + "release_date": "2024-10-01", + "last_updated": "2024-10-04", "cost": { - "input": 0.5, - "output": 1.5 - }, - "type": "chat" + "input": 0.04, + "output": 0.04 + } }, { - "id": "mistral/pixtral-large", - "name": "Pixtral Large", - "display_name": "Pixtral Large", + "id": "pixtral-12b", + "name": "Pixtral 12B", + "display_name": "Pixtral 12B", "modalities": { "input": [ "text", @@ -11351,62 +11170,62 @@ }, "attachment": true, "open_weights": true, - "knowledge": "2024-11", - "release_date": "2024-11-01", - "last_updated": "2024-11-04", + "knowledge": "2024-09", + "release_date": "2024-09-01", + "last_updated": "2024-09-01", "cost": { - "input": 2, - "output": 6 - }, - "type": "chat" + "input": 0.15, + "output": 0.15 + } }, { - "id": "mistral/ministral-8b", - "name": "Ministral 8B", - "display_name": "Ministral 8B", + "id": "mistral-medium-2505", + "name": "Mistral Medium 3", + "display_name": "Mistral Medium 3", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2024-10-01", - "last_updated": "2024-10-04", + "attachment": true, + "open_weights": false, + "knowledge": "2025-05", + "release_date": "2025-05-07", + "last_updated": "2025-05-07", "cost": { - "input": 0.1, - "output": 0.1 - }, - "type": "chat" + "input": 0.4, + "output": 2 + } }, { - "id": "mistral/ministral-3b", - "name": "Ministral 3B", - "display_name": "Ministral 3B", + "id": "labs-devstral-small-2512", + "name": "Devstral Small 2", + "display_name": "Devstral Small 2", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 256000, + "output": 256000 }, "temperature": true, "tool_call": true, @@ -11415,19 +11234,18 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-10", - "release_date": "2024-10-01", - "last_updated": "2024-10-04", + "knowledge": "2025-12", + "release_date": "2025-12-09", + "last_updated": "2025-12-09", "cost": { - "input": 0.04, - "output": 0.04 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "mistral/magistral-small", - "name": "Magistral Small", - "display_name": "Magistral Small", + "id": "devstral-medium-latest", + "name": "Devstral 2", + "display_name": "Devstral 2", "modalities": { "input": [ "text" @@ -11437,34 +11255,31 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-06", - "release_date": "2025-03-17", - "last_updated": "2025-03-17", + "knowledge": "2025-12", + "release_date": "2025-12-02", + "last_updated": "2025-12-02", "cost": { - "input": 0.5, - "output": 1.5 - }, - "type": "chat" + "input": 0.4, + "output": 2 + } }, { - "id": "mistral/mistral-small", - "name": "Mistral Small", - "display_name": "Mistral Small", + "id": "devstral-small-2505", + "name": "Devstral Small 2505", + "display_name": "Devstral Small 2505", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -11472,7 +11287,7 @@ }, "limit": { "context": 128000, - "output": 16384 + "output": 128000 }, "temperature": true, "tool_call": true, @@ -11481,19 +11296,18 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-03", - "release_date": "2024-09-01", - "last_updated": "2024-09-04", + "knowledge": "2025-05", + "release_date": "2025-05-07", + "last_updated": "2025-05-07", "cost": { "input": 0.1, "output": 0.3 - }, - "type": "chat" + } }, { - "id": "mistral/pixtral-12b", - "name": "Pixtral 12B", - "display_name": "Pixtral 12B", + "id": "mistral-medium-2508", + "name": "Mistral Medium 3.1", + "display_name": "Mistral Medium 3.1", "modalities": { "input": [ "text", @@ -11504,8 +11318,8 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -11513,20 +11327,19 @@ "supported": false }, "attachment": true, - "open_weights": true, - "knowledge": "2024-09", - "release_date": "2024-09-01", - "last_updated": "2024-09-01", + "open_weights": false, + "knowledge": "2025-05", + "release_date": "2025-08-12", + "last_updated": "2025-08-12", "cost": { - "input": 0.15, - "output": 0.15 - }, - "type": "chat" + "input": 0.4, + "output": 2 + } }, { - "id": "mistral/mixtral-8x22b-instruct", - "name": "Mixtral 8x22B", - "display_name": "Mixtral 8x22B", + "id": "mistral-embed", + "name": "Mistral Embed", + "display_name": "Mistral Embed", "modalities": { "input": [ "text" @@ -11536,29 +11349,27 @@ ] }, "limit": { - "context": 64000, - "output": 64000 + "context": 8000, + "output": 3072 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-04", - "release_date": "2024-04-17", - "last_updated": "2024-04-17", + "open_weights": false, + "release_date": "2023-12-11", + "last_updated": "2023-12-11", "cost": { - "input": 2, - "output": 6 - }, - "type": "chat" + "input": 0.1, + "output": 0 + } }, { - "id": "vercel/v0-1.0-md", - "name": "v0-1.0-md", - "display_name": "v0-1.0-md", + "id": "mistral-small-latest", + "name": "Mistral Small", + "display_name": "Mistral Small", "modalities": { "input": [ "text", @@ -11570,32 +11381,30 @@ }, "limit": { "context": 128000, - "output": 32000 + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "attachment": false, + "open_weights": true, + "knowledge": "2025-03", + "release_date": "2024-09-01", + "last_updated": "2024-09-04", "cost": { - "input": 3, - "output": 15 - }, - "type": "chat" + "input": 0.1, + "output": 0.3 + } }, { - "id": "vercel/v0-1.5-md", - "name": "v0-1.5-md", - "display_name": "v0-1.5-md", + "id": "magistral-small", + "name": "Magistral Small", + "display_name": "Magistral Small", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -11603,7 +11412,7 @@ }, "limit": { "context": 128000, - "output": 32000 + "output": 128000 }, "temperature": true, "tool_call": true, @@ -11611,20 +11420,20 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-06-09", - "last_updated": "2025-06-09", + "attachment": false, + "open_weights": true, + "knowledge": "2025-06", + "release_date": "2025-03-17", + "last_updated": "2025-03-17", "cost": { - "input": 3, - "output": 15 - }, - "type": "chat" + "input": 0.5, + "output": 1.5 + } }, { - "id": "deepseek/deepseek-v3.2-exp-thinking", - "name": "DeepSeek V3.2 Exp Thinking", - "display_name": "DeepSeek V3.2 Exp Thinking", + "id": "devstral-small-2507", + "name": "Devstral Small", + "display_name": "Devstral Small", "modalities": { "input": [ "text" @@ -11634,30 +11443,28 @@ ] }, "limit": { - "context": 163840, - "output": 8192 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2025-09", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "open_weights": true, + "knowledge": "2025-05", + "release_date": "2025-07-10", + "last_updated": "2025-07-10", "cost": { - "input": 0.28, - "output": 0.42 - }, - "type": "chat" + "input": 0.1, + "output": 0.3 + } }, { - "id": "deepseek/deepseek-v3.1-terminus", - "name": "DeepSeek V3.1 Terminus", - "display_name": "DeepSeek V3.1 Terminus", + "id": "codestral-latest", + "name": "Codestral", + "display_name": "Codestral", "modalities": { "input": [ "text" @@ -11667,30 +11474,28 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 256000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-07", - "release_date": "2025-09-22", - "last_updated": "2025-09-22", + "knowledge": "2024-10", + "release_date": "2024-05-29", + "last_updated": "2025-01-04", "cost": { - "input": 0.27, - "output": 1 - }, - "type": "chat" + "input": 0.3, + "output": 0.9 + } }, { - "id": "deepseek/deepseek-v3.2-exp", - "name": "DeepSeek V3.2 Exp", - "display_name": "DeepSeek V3.2 Exp", + "id": "open-mixtral-8x7b", + "name": "Mixtral 8x7B", + "display_name": "Mixtral 8x7B", "modalities": { "input": [ "text" @@ -11700,8 +11505,8 @@ ] }, "limit": { - "context": 163840, - "output": 8192 + "context": 32000, + "output": 32000 }, "temperature": true, "tool_call": true, @@ -11709,20 +11514,19 @@ "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2025-09", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "open_weights": true, + "knowledge": "2024-01", + "release_date": "2023-12-11", + "last_updated": "2023-12-11", "cost": { - "input": 0.28, - "output": 0.42 - }, - "type": "chat" + "input": 0.7, + "output": 0.7 + } }, { - "id": "deepseek/deepseek-r1-distill-llama-70b", - "name": "DeepSeek R1 Distill Llama 70B", - "display_name": "DeepSeek R1 Distill Llama 70B", + "id": "mistral-nemo", + "name": "Mistral Nemo", + "display_name": "Mistral Nemo", "modalities": { "input": [ "text" @@ -11732,30 +11536,28 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, "knowledge": "2024-07", - "release_date": "2025-01-20", - "last_updated": "2025-01-20", + "release_date": "2024-07-01", + "last_updated": "2024-07-01", "cost": { - "input": 0.75, - "output": 0.99 - }, - "type": "chat" + "input": 0.15, + "output": 0.15 + } }, { - "id": "deepseek/deepseek-r1", - "name": "DeepSeek-R1", - "display_name": "DeepSeek-R1", + "id": "open-mistral-7b", + "name": "Mistral 7B", + "display_name": "Mistral 7B", "modalities": { "input": [ "text" @@ -11765,161 +11567,134 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 8000, + "output": 8000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-07", - "release_date": "2025-01-20", - "last_updated": "2025-05-29", - "cost": { - "input": 1.35, - "output": 5.4 - }, - "type": "chat" + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2023-09-27", + "last_updated": "2023-09-27", + "cost": { + "input": 0.25, + "output": 0.25 + } }, { - "id": "minimax/minimax-m2", - "name": "MiniMax M2", - "display_name": "MiniMax M2", + "id": "mistral-large-latest", + "name": "Mistral Large", + "display_name": "Mistral Large", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 205000, - "output": 131072 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-10-27", - "last_updated": "2025-10-27", + "knowledge": "2024-11", + "release_date": "2024-11-01", + "last_updated": "2025-12-02", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.03, - "cache_write": 0.38 - }, - "type": "chat" + "input": 0.5, + "output": 1.5 + } }, { - "id": "google/gemini-3-pro-preview", - "name": "Gemini 3 Pro Preview", - "display_name": "Gemini 3 Pro Preview", + "id": "mistral-medium-latest", + "name": "Mistral Medium", + "display_name": "Mistral Medium", "modalities": { "input": [ "text", - "image", - "video", - "audio", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-11-18", - "last_updated": "2025-11-18", + "attachment": false, + "open_weights": true, + "knowledge": "2025-05", + "release_date": "2025-05-07", + "last_updated": "2025-05-10", "cost": { - "input": 2, - "output": 12, - "cache_read": 0.2, - "context_over_200k": { - "input": 4, - "output": 18, - "cache_read": 0.4 - } - }, - "type": "chat" + "input": 0.4, + "output": 2 + } }, { - "id": "google/gemini-2.5-flash-lite", - "name": "Gemini 2.5 Flash Lite", - "display_name": "Gemini 2.5 Flash Lite", + "id": "mistral-large-2411", + "name": "Mistral Large 2.1", + "display_name": "Mistral Large 2.1", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 131072, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-06-17", - "last_updated": "2025-06-17", + "attachment": false, + "open_weights": true, + "knowledge": "2024-11", + "release_date": "2024-11-01", + "last_updated": "2024-11-04", "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.025 - }, - "type": "chat" + "input": 2, + "output": 6 + } }, { - "id": "google/gemini-2.5-flash-preview-09-2025", - "name": "Gemini 2.5 Flash Preview 09-25", - "display_name": "Gemini 2.5 Flash Preview 09-25", + "id": "magistral-medium-latest", + "name": "Magistral Medium", + "display_name": "Magistral Medium", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -11927,97 +11702,90 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-09-25", - "last_updated": "2025-09-25", + "attachment": false, + "open_weights": true, + "knowledge": "2025-06", + "release_date": "2025-03-17", + "last_updated": "2025-03-20", "cost": { - "input": 0.3, - "output": 2.5, - "cache_read": 0.075, - "cache_write": 0.383 - }, - "type": "chat" - }, + "input": 2, + "output": 5 + } + } + ] + }, + "abacus": { + "id": "abacus", + "name": "Abacus", + "display_name": "Abacus", + "api": "https://routellm.abacus.ai/v1", + "doc": "https://abacus.ai/help/api", + "models": [ { - "id": "google/gemini-2.5-flash-lite-preview-09-2025", - "name": "Gemini 2.5 Flash Lite Preview 09-25", - "display_name": "Gemini 2.5 Flash Lite Preview 09-25", + "id": "gpt-4.1-nano", + "name": "GPT-4.1 Nano", + "display_name": "GPT-4.1 Nano", "modalities": { "input": [ "text", - "image", - "audio", - "video", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 1047576, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-09-25", - "last_updated": "2025-09-25", + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { "input": 0.1, - "output": 0.4, - "cache_read": 0.025 - }, - "type": "chat" + "output": 0.4 + } }, { - "id": "google/gemini-2.5-pro", - "name": "Gemini 2.5 Pro", - "display_name": "Gemini 2.5 Pro", + "id": "grok-4-fast-non-reasoning", + "name": "Grok 4 Fast (Non-Reasoning)", + "display_name": "Grok 4 Fast (Non-Reasoning)", "modalities": { "input": [ "text", - "image", - "audio", - "video", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 2000000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-03-20", - "last_updated": "2025-06-05", + "release_date": "2025-07-09", + "last_updated": "2025-07-09", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.31 - }, - "type": "chat" + "input": 0.2, + "output": 0.5 + } }, { - "id": "google/gemini-2.0-flash", + "id": "gemini-2.0-flash-001", "name": "Gemini 2.0 Flash", "display_name": "Gemini 2.0 Flash", "modalities": { @@ -12025,15 +11793,14 @@ "text", "image", "audio", - "video", - "pdf" + "video" ], "output": [ "text" ] }, "limit": { - "context": 1048576, + "context": 1000000, "output": 8192 }, "temperature": true, @@ -12043,20 +11810,17 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-06", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "release_date": "2025-02-05", + "last_updated": "2025-02-05", "cost": { "input": 0.1, - "output": 0.4, - "cache_read": 0.025 - }, - "type": "chat" + "output": 0.4 + } }, { - "id": "google/gemini-2.0-flash-lite", - "name": "Gemini 2.0 Flash Lite", - "display_name": "Gemini 2.0 Flash Lite", + "id": "gemini-3-flash-preview", + "name": "Gemini 3 Flash Preview", + "display_name": "Gemini 3 Flash Preview", "modalities": { "input": [ "text", @@ -12071,99 +11835,91 @@ }, "limit": { "context": 1048576, - "output": 8192 + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2024-06", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "knowledge": "2025-01", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", "cost": { - "input": 0.075, - "output": 0.3 - }, - "type": "chat" + "input": 0.5, + "output": 3 + } }, { - "id": "google/gemini-2.5-flash", - "name": "Gemini 2.5 Flash", - "display_name": "Gemini 2.5 Flash", + "id": "route-llm", + "name": "Route LLM", + "display_name": "Route LLM", "modalities": { "input": [ "text", - "image", - "audio", - "video", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-03-20", - "last_updated": "2025-06-05", + "knowledge": "2024-10", + "release_date": "2024-01-01", + "last_updated": "2024-01-01", "cost": { - "input": 0.3, - "output": 2.5, - "cache_read": 0.075, - "input_audio": 1 - }, - "type": "chat" + "input": 0.5, + "output": 1.5 + } }, { - "id": "openai/gpt-oss-20b", - "name": "GPT OSS 20B", - "display_name": "GPT OSS 20B", + "id": "grok-code-fast-1", + "name": "Grok Code Fast 1", + "display_name": "Grok Code Fast 1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 256000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "attachment": true, + "open_weights": false, + "release_date": "2025-09-01", + "last_updated": "2025-09-01", "cost": { - "input": 0.07, - "output": 0.3 - }, - "type": "chat" + "input": 0.2, + "output": 1.5 + } }, { - "id": "openai/gpt-oss-120b", - "name": "GPT OSS 120B", - "display_name": "GPT OSS 120B", + "id": "kimi-k2-turbo-preview", + "name": "Kimi K2 Turbo Preview", + "display_name": "Kimi K2 Turbo Preview", "modalities": { "input": [ "text" @@ -12173,43 +11929,43 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 256000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "open_weights": false, + "release_date": "2025-07-08", + "last_updated": "2025-07-08", "cost": { - "input": 0.1, - "output": 0.5 - }, - "type": "chat" + "input": 0.15, + "output": 8 + } }, { - "id": "openai/gpt-5", - "name": "GPT-5", - "display_name": "GPT-5", + "id": "gemini-3-pro-preview", + "name": "Gemini 3 Pro Preview", + "display_name": "Gemini 3 Pro Preview", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 1000000, + "output": 65000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -12217,54 +11973,53 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "release_date": "2025-06-01", + "last_updated": "2025-06-01", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.13 - }, - "type": "chat" + "input": 2, + "output": 12 + } }, { - "id": "openai/gpt-4o-mini", - "name": "GPT-4o mini", - "display_name": "GPT-4o mini", + "id": "gemini-2.5-flash", + "name": "Gemini 2.5 Flash", + "display_name": "Gemini 2.5 Flash", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-07-18", - "last_updated": "2024-07-18", + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-06-05", "cost": { - "input": 0.15, - "output": 0.6, - "cache_read": 0.08 - }, - "type": "chat" + "input": 0.3, + "output": 2.5 + } }, { - "id": "openai/o3", - "name": "o3", - "display_name": "o3", + "id": "gpt-4.1-mini", + "name": "GPT-4.1 Mini", + "display_name": "GPT-4.1 Mini", "modalities": { "input": [ "text", @@ -12275,45 +12030,43 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 1047576, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2024-05", - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 2, - "output": 8, - "cache_read": 0.5 - }, - "type": "chat" + "input": 0.4, + "output": 1.6 + } }, { - "id": "openai/gpt-5-mini", - "name": "GPT-5 Mini", - "display_name": "GPT-5 Mini", + "id": "claude-opus-4-5-20251101", + "name": "Claude Opus 4.5", + "display_name": "Claude Opus 4.5", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 200000, + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -12321,55 +12074,82 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "knowledge": "2025-03-31", + "release_date": "2025-11-01", + "last_updated": "2025-11-01", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.03 - }, - "type": "chat" + "input": 5, + "output": 25 + } }, { - "id": "openai/o1", - "name": "o1", - "display_name": "o1", + "id": "qwen-2.5-coder-32b", + "name": "Qwen 2.5 Coder 32B", + "display_name": "Qwen 2.5 Coder 32B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 128000, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-12-05", - "last_updated": "2024-12-05", + "attachment": false, + "open_weights": true, + "release_date": "2024-11-11", + "last_updated": "2024-11-11", "cost": { - "input": 15, - "output": 60, - "cache_read": 7.5 - }, - "type": "chat" + "input": 0.79, + "output": 0.79 + } }, { - "id": "openai/o4-mini", - "name": "o4-mini", - "display_name": "o4-mini", + "id": "claude-sonnet-4-5-20250929", + "name": "Claude Sonnet 4.5", + "display_name": "Claude Sonnet 4.5", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 200000, + "output": 64000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", + "cost": { + "input": 3, + "output": 15 + } + }, + { + "id": "grok-4-0709", + "name": "Grok 4", + "display_name": "Grok 4", "modalities": { "input": [ "text", @@ -12379,6 +12159,37 @@ "text" ] }, + "limit": { + "context": 256000, + "output": 16384 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-07-09", + "last_updated": "2025-07-09", + "cost": { + "input": 3, + "output": 15 + } + }, + { + "id": "o3-mini", + "name": "o3-mini", + "display_name": "o3-mini", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, "limit": { "context": 200000, "output": 100000 @@ -12389,22 +12200,20 @@ "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, "knowledge": "2024-05", - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "release_date": "2024-12-20", + "last_updated": "2025-01-29", "cost": { "input": 1.1, - "output": 4.4, - "cache_read": 0.28 - }, - "type": "chat" + "output": 4.4 + } }, { - "id": "openai/gpt-4.1", - "name": "GPT-4.1", - "display_name": "GPT-4.1", + "id": "gpt-5.2-chat-latest", + "name": "GPT-5.2 Chat Latest", + "display_name": "GPT-5.2 Chat Latest", "modalities": { "input": [ "text", @@ -12415,42 +12224,43 @@ ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 400000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "knowledge": "2024-09-30", + "release_date": "2026-01-01", + "last_updated": "2026-01-01", "cost": { - "input": 2, - "output": 8, - "cache_read": 0.5 - }, - "type": "chat" + "input": 1.5, + "output": 12 + } }, { - "id": "openai/gpt-4o", - "name": "GPT-4o", - "display_name": "GPT-4o", + "id": "gemini-2.0-pro-exp-02-05", + "name": "Gemini 2.0 Pro Exp", + "display_name": "Gemini 2.0 Pro Exp", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 2000000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -12459,20 +12269,13 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-05-13", - "last_updated": "2024-08-06", - "cost": { - "input": 2.5, - "output": 10, - "cache_read": 1.25 - }, - "type": "chat" + "release_date": "2025-02-05", + "last_updated": "2025-02-05" }, { - "id": "openai/gpt-5-codex", - "name": "GPT-5-Codex", - "display_name": "GPT-5-Codex", + "id": "gpt-5.1", + "name": "GPT-5.1", + "display_name": "GPT-5.1", "modalities": { "input": [ "text", @@ -12492,20 +12295,18 @@ "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, "knowledge": "2024-09-30", - "release_date": "2025-09-15", - "last_updated": "2025-09-15", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { "input": 1.25, - "output": 10, - "cache_read": 0.125 - }, - "type": "chat" + "output": 10 + } }, { - "id": "openai/gpt-5-nano", + "id": "gpt-5-nano", "name": "GPT-5 Nano", "display_name": "GPT-5 Nano", "modalities": { @@ -12534,18 +12335,18 @@ "last_updated": "2025-08-07", "cost": { "input": 0.05, - "output": 0.4, - "cache_read": 0.01 - }, - "type": "chat" + "output": 0.4 + } }, { - "id": "openai/o3-mini", - "name": "o3-mini", - "display_name": "o3-mini", + "id": "claude-sonnet-4-20250514", + "name": "Claude Sonnet 4", + "display_name": "Claude Sonnet 4", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" @@ -12553,30 +12354,27 @@ }, "limit": { "context": 200000, - "output": 100000 + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-05", - "release_date": "2024-12-20", - "last_updated": "2025-01-29", + "release_date": "2025-05-14", + "last_updated": "2025-05-14", "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.55 - }, - "type": "chat" + "input": 3, + "output": 15 + } }, { - "id": "openai/gpt-4-turbo", - "name": "GPT-4 Turbo", - "display_name": "GPT-4 Turbo", + "id": "gpt-4.1", + "name": "GPT-4.1", + "display_name": "GPT-4.1", "modalities": { "input": [ "text", @@ -12587,8 +12385,8 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 1047576, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -12597,19 +12395,18 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2023-12", - "release_date": "2023-11-06", - "last_updated": "2024-04-09", + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 10, - "output": 30 - }, - "type": "chat" + "input": 2, + "output": 8 + } }, { - "id": "openai/gpt-4.1-mini", - "name": "GPT-4.1 mini", - "display_name": "GPT-4.1 mini", + "id": "o4-mini", + "name": "o4-mini", + "display_name": "o4-mini", "modalities": { "input": [ "text", @@ -12620,97 +12417,95 @@ ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "knowledge": "2024-05", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "cost": { - "input": 0.4, - "output": 1.6, - "cache_read": 0.1 - }, - "type": "chat" + "input": 1.1, + "output": 4.4 + } }, { - "id": "openai/gpt-4.1-nano", - "name": "GPT-4.1 nano", - "display_name": "GPT-4.1 nano", + "id": "claude-opus-4-20250514", + "name": "Claude Opus 4", + "display_name": "Claude Opus 4", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 200000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "release_date": "2025-05-14", + "last_updated": "2025-05-14", "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.03 - }, - "type": "chat" + "input": 15, + "output": 75 + } }, { - "id": "perplexity/sonar-reasoning", - "name": "Sonar Reasoning", - "display_name": "Sonar Reasoning", + "id": "gpt-5-mini", + "name": "GPT-5 Mini", + "display_name": "GPT-5 Mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 127000, - "output": 8000 + "context": 400000, + "output": 128000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-09", - "release_date": "2025-02-19", - "last_updated": "2025-02-19", + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 1, - "output": 5 - }, - "type": "chat" + "input": 0.25, + "output": 2 + } }, { - "id": "perplexity/sonar", - "name": "Sonar", - "display_name": "Sonar", + "id": "o3-pro", + "name": "o3-pro", + "display_name": "o3-pro", "modalities": { "input": [ "text", @@ -12721,33 +12516,34 @@ ] }, "limit": { - "context": 127000, - "output": 8000 + "context": 200000, + "output": 100000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-02", - "release_date": "2025-02-19", - "last_updated": "2025-02-19", + "knowledge": "2024-05", + "release_date": "2025-06-10", + "last_updated": "2025-06-10", "cost": { - "input": 1, - "output": 1 - }, - "type": "chat" + "input": 20, + "output": 80 + } }, { - "id": "perplexity/sonar-pro", - "name": "Sonar Pro", - "display_name": "Sonar Pro", + "id": "claude-3-7-sonnet-20250219", + "name": "Claude Sonnet 3.7", + "display_name": "Claude Sonnet 3.7", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -12755,64 +12551,69 @@ }, "limit": { "context": 200000, - "output": 8000 + "output": 64000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-09", + "knowledge": "2024-10-31", "release_date": "2025-02-19", "last_updated": "2025-02-19", "cost": { "input": 3, "output": 15 - }, - "type": "chat" + } }, { - "id": "perplexity/sonar-reasoning-pro", - "name": "Sonar Reasoning Pro", - "display_name": "Sonar Reasoning Pro", + "id": "gemini-2.5-pro", + "name": "Gemini 2.5 Pro", + "display_name": "Gemini 2.5 Pro", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 127000, - "output": 8000 + "context": 1048576, + "output": 65536 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-09", - "release_date": "2025-02-19", - "last_updated": "2025-02-19", + "knowledge": "2025-01", + "release_date": "2025-03-25", + "last_updated": "2025-03-25", "cost": { - "input": 2, - "output": 8 - }, - "type": "chat" + "input": 1.25, + "output": 10 + } }, { - "id": "zai/glm-4.5", - "name": "GLM 4.5", - "display_name": "GLM 4.5", + "id": "gpt-4o-2024-11-20", + "name": "GPT-4o (2024-11-20)", + "display_name": "GPT-4o (2024-11-20)", "modalities": { "input": [ - "text" + "text", + "image", + "audio" ], "output": [ "text" @@ -12820,62 +12621,60 @@ }, "limit": { "context": 128000, - "output": 96000 + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-07", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "attachment": true, + "open_weights": false, + "knowledge": "2024-10", + "release_date": "2024-11-20", + "last_updated": "2024-11-20", "cost": { - "input": 0.6, - "output": 2.2 - }, - "type": "chat" + "input": 2.5, + "output": 10 + } }, { - "id": "zai/glm-4.5-air", - "name": "GLM 4.5 Air", - "display_name": "GLM 4.5 Air", + "id": "o3", + "name": "o3", + "display_name": "o3", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 96000 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "attachment": true, + "open_weights": false, + "knowledge": "2024-05", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "cost": { - "input": 0.2, - "output": 1.1 - }, - "type": "chat" + "input": 2, + "output": 8 + } }, { - "id": "zai/glm-4.5v", - "name": "GLM 4.5V", - "display_name": "GLM 4.5V", + "id": "gpt-4o-mini", + "name": "GPT-4o Mini", + "display_name": "GPT-4o Mini", "modalities": { "input": [ "text", @@ -12886,30 +12685,28 @@ ] }, "limit": { - "context": 66000, - "output": 16000 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, - "open_weights": true, - "knowledge": "2025-08", - "release_date": "2025-08-11", - "last_updated": "2025-08-11", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", "cost": { - "input": 0.6, - "output": 1.8 - }, - "type": "chat" + "input": 0.15, + "output": 0.6 + } }, { - "id": "zai/glm-4.6", - "name": "GLM 4.6", - "display_name": "GLM 4.6", + "id": "qwen3-max", + "name": "Qwen3 Max", + "display_name": "Qwen3 Max", "modalities": { "input": [ "text" @@ -12919,8 +12716,8 @@ ] }, "limit": { - "context": 200000, - "output": 96000 + "context": 131072, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -12929,66 +12726,63 @@ "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-09-30", - "last_updated": "2025-09-30", + "open_weights": false, + "release_date": "2025-05-28", + "last_updated": "2025-05-28", "cost": { - "input": 0.6, - "output": 2.2 - }, - "type": "chat" + "input": 1.2, + "output": 6 + } }, { - "id": "amazon/nova-micro", - "name": "Nova Micro", - "display_name": "Nova Micro", + "id": "gpt-5", + "name": "GPT-5", + "display_name": "GPT-5", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-12-03", - "last_updated": "2024-12-03", + "knowledge": "2024-09-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.035, - "output": 0.14, - "cache_read": 0.00875 - }, - "type": "chat" + "input": 1.25, + "output": 10 + } }, { - "id": "amazon/nova-pro", - "name": "Nova Pro", - "display_name": "Nova Pro", + "id": "grok-4-1-fast-non-reasoning", + "name": "Grok 4.1 Fast (Non-Reasoning)", + "display_name": "Grok 4.1 Fast (Non-Reasoning)", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 300000, - "output": 8192 + "context": 2000000, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -12997,117 +12791,113 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-12-03", - "last_updated": "2024-12-03", + "release_date": "2025-11-17", + "last_updated": "2025-11-17", "cost": { - "input": 0.8, - "output": 3.2, - "cache_read": 0.2 - }, - "type": "chat" + "input": 0.2, + "output": 0.5 + } }, { - "id": "amazon/nova-lite", - "name": "Nova Lite", - "display_name": "Nova Lite", + "id": "llama-3.3-70b-versatile", + "name": "Llama 3.3 70B Versatile", + "display_name": "Llama 3.3 70B Versatile", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 300000, - "output": 8192 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-12-03", - "last_updated": "2024-12-03", + "attachment": false, + "open_weights": true, + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 0.06, - "output": 0.24, - "cache_read": 0.015 - }, - "type": "chat" + "input": 0.59, + "output": 0.79 + } }, { - "id": "morph/morph-v3-fast", - "name": "Morph v3 Fast", - "display_name": "Morph v3 Fast", + "id": "claude-opus-4-1-20250805", + "name": "Claude Opus 4.1", + "display_name": "Claude Opus 4.1", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 16000, - "output": 16000 + "context": 200000, + "output": 32000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2024-08-15", - "last_updated": "2024-08-15", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.8, - "output": 1.2 - }, - "type": "chat" + "input": 15, + "output": 75 + } }, { - "id": "morph/morph-v3-large", - "name": "Morph v3 Large", - "display_name": "Morph v3 Large", + "id": "gpt-5.2", + "name": "GPT-5.2", + "display_name": "GPT-5.2", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32000, - "output": 32000 + "context": 400000, + "output": 128000 }, "temperature": false, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2024-08-15", - "last_updated": "2024-08-15", + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 0.9, - "output": 1.9 - }, - "type": "chat" + "input": 1.75, + "output": 14 + } }, { - "id": "meta/llama-4-scout", - "name": "Llama-4-Scout-17B-16E-Instruct-FP8", - "display_name": "Llama-4-Scout-17B-16E-Instruct-FP8", + "id": "gpt-5.1-chat-latest", + "name": "GPT-5.1 Chat Latest", + "display_name": "GPT-5.1 Chat Latest", "modalities": { "input": [ "text", @@ -13118,65 +12908,66 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, - "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 1.25, + "output": 10 + } }, { - "id": "meta/llama-3.3-70b", - "name": "Llama-3.3-70B-Instruct", - "display_name": "Llama-3.3-70B-Instruct", + "id": "claude-haiku-4-5-20251001", + "name": "Claude Haiku 4.5", + "display_name": "Claude Haiku 4.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "open_weights": false, + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 1, + "output": 5 + } }, { - "id": "meta/llama-4-maverick", - "name": "Llama-4-Maverick-17B-128E-Instruct-FP8", - "display_name": "Llama-4-Maverick-17B-128E-Instruct-FP8", + "id": "deepseek/deepseek-v3.1", + "name": "DeepSeek V3.1", + "display_name": "DeepSeek V3.1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -13184,41 +12975,39 @@ }, "limit": { "context": 128000, - "output": 4096 + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "release_date": "2025-01-20", + "last_updated": "2025-01-20", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.14, + "output": 0.28 + } }, { - "id": "anthropic/claude-haiku-4.5", - "name": "Claude Haiku 4.5", - "display_name": "Claude Haiku 4.5", + "id": "openai/gpt-oss-120b", + "name": "GPT-OSS 120B", + "display_name": "GPT-OSS 120B", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -13227,255 +13016,212 @@ "default": true }, "attachment": true, - "open_weights": false, - "knowledge": "2025-02-28", - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "open_weights": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 1, - "output": 1.25, - "cache_read": 0.1, - "cache_write": 1.25 - }, - "type": "chat" + "input": 0.08, + "output": 0.44 + } }, { - "id": "anthropic/claude-opus-4.5", - "name": "Claude Opus 4.5", - "display_name": "Claude Opus 4.5", + "id": "meta-llama/Meta-Llama-3.1-8B-Instruct", + "name": "Llama 3.1 8B Instruct", + "display_name": "Llama 3.1 8B Instruct", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-11-24", - "last_updated": "2025-11-24", + "attachment": false, + "open_weights": true, + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 5, - "output": 25, - "cache_read": 1.5, - "cache_write": 18.75 - }, - "type": "chat" + "input": 0.02, + "output": 0.05 + } }, { - "id": "anthropic/claude-3.5-haiku", - "name": "Claude Haiku 3.5", - "display_name": "Claude Haiku 3.5", + "id": "meta-llama/Meta-Llama-3.1-405B-Instruct-Turbo", + "name": "Llama 3.1 405B Instruct Turbo", + "display_name": "Llama 3.1 405B Instruct Turbo", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 8192 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-07-31", - "release_date": "2024-10-22", - "last_updated": "2024-10-22", + "attachment": false, + "open_weights": true, + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 0.8, - "output": 4, - "cache_read": 0.08, - "cache_write": 1 - }, - "type": "chat" + "input": 3.5, + "output": 3.5 + } }, { - "id": "anthropic/claude-3.7-sonnet", - "name": "Claude Sonnet 3.7", - "display_name": "Claude Sonnet 3.7", + "id": "meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8", + "name": "Llama 4 Maverick 17B 128E Instruct FP8", + "display_name": "Llama 4 Maverick 17B 128E Instruct FP8", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 1000000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2024-10-31", - "release_date": "2025-02-19", - "last_updated": "2025-02-19", + "open_weights": true, + "knowledge": "2024-08", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 - }, - "type": "chat" + "input": 0.14, + "output": 0.59 + } }, { - "id": "anthropic/claude-4.5-sonnet", - "name": "Claude Sonnet 4.5", - "display_name": "Claude Sonnet 4.5", + "id": "meta-llama/Meta-Llama-3.1-70B-Instruct", + "name": "Llama 3.1 70B Instruct", + "display_name": "Llama 3.1 70B Instruct", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "attachment": false, + "open_weights": true, + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 - }, - "type": "chat" + "input": 0.4, + "output": 0.4 + } }, { - "id": "anthropic/claude-3.5-sonnet", - "name": "Claude Sonnet 3.5 v2", - "display_name": "Claude Sonnet 3.5 v2", + "id": "Qwen/Qwen3-235B-A22B-Instruct-2507", + "name": "Qwen3 235B A22B Instruct", + "display_name": "Qwen3 235B A22B Instruct", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, + "context": 262144, "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-04-30", - "release_date": "2024-10-22", - "last_updated": "2024-10-22", + "attachment": false, + "open_weights": true, + "release_date": "2025-07-01", + "last_updated": "2025-07-01", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 - }, - "type": "chat" + "input": 0.13, + "output": 0.6 + } }, { - "id": "anthropic/claude-4-1-opus", - "name": "Claude Opus 4", - "display_name": "Claude Opus 4", + "id": "Qwen/Qwen2.5-72B-Instruct", + "name": "Qwen 2.5 72B Instruct", + "display_name": "Qwen 2.5 72B Instruct", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "attachment": false, + "open_weights": true, + "release_date": "2024-09-19", + "last_updated": "2024-09-19", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 - }, - "type": "chat" + "input": 0.11, + "output": 0.38 + } }, { - "id": "anthropic/claude-4-sonnet", - "name": "Claude Sonnet 4", - "display_name": "Claude Sonnet 4", + "id": "Qwen/QwQ-32B", + "name": "QwQ 32B", + "display_name": "QwQ 32B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 32768, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -13483,141 +13229,111 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "attachment": false, + "open_weights": true, + "release_date": "2024-11-28", + "last_updated": "2024-11-28", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 - }, - "type": "chat" + "input": 0.4, + "output": 0.4 + } }, { - "id": "anthropic/claude-3-opus", - "name": "Claude Opus 3", - "display_name": "Claude Opus 3", + "id": "Qwen/Qwen3-32B", + "name": "Qwen3 32B", + "display_name": "Qwen3 32B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 4096 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2023-08-31", - "release_date": "2024-02-29", - "last_updated": "2024-02-29", + "attachment": false, + "open_weights": true, + "release_date": "2025-04-29", + "last_updated": "2025-04-29", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 - }, - "type": "chat" + "input": 0.09, + "output": 0.29 + } }, { - "id": "anthropic/claude-3-haiku", - "name": "Claude Haiku 3", - "display_name": "Claude Haiku 3", + "id": "Qwen/qwen3-coder-480b-a35b-instruct", + "name": "Qwen3 Coder 480B A35B Instruct", + "display_name": "Qwen3 Coder 480B A35B Instruct", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 4096 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2023-08-31", - "release_date": "2024-03-13", - "last_updated": "2024-03-13", + "attachment": false, + "open_weights": true, + "release_date": "2025-07-22", + "last_updated": "2025-07-22", "cost": { - "input": 0.25, - "output": 1.25, - "cache_read": 0.03, - "cache_write": 0.3 - }, - "type": "chat" + "input": 0.29, + "output": 1.2 + } }, { - "id": "anthropic/claude-4-opus", - "name": "Claude Opus 4", - "display_name": "Claude Opus 4", + "id": "zai-org/glm-4.7", + "name": "GLM-4.7", + "display_name": "GLM-4.7", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "attachment": false, + "open_weights": true, + "release_date": "2025-06-01", + "last_updated": "2025-06-01", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 - }, - "type": "chat" - } - ] - }, - "nebius": { - "id": "nebius", - "name": "Nebius Token Factory", - "display_name": "Nebius Token Factory", - "api": "https://api.tokenfactory.nebius.com/v1", - "doc": "https://docs.tokenfactory.nebius.com/", - "models": [ + "input": 0.7, + "output": 2.5 + } + }, { - "id": "NousResearch/hermes-4-70b", - "name": "Hermes 4 70B", - "display_name": "Hermes 4 70B", + "id": "zai-org/glm-4.5", + "name": "GLM-4.5", + "display_name": "GLM-4.5", "modalities": { "input": [ "text" @@ -13627,7 +13343,7 @@ ] }, "limit": { - "context": 131072, + "context": 128000, "output": 8192 }, "temperature": true, @@ -13637,20 +13353,18 @@ "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2024-07", - "release_date": "2024-08-01", - "last_updated": "2025-10-04", + "open_weights": true, + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 0.13, - "output": 0.4 - }, - "type": "chat" + "input": 0.6, + "output": 2.2 + } }, { - "id": "NousResearch/hermes-4-405b", - "name": "Hermes-4 405B", - "display_name": "Hermes-4 405B", + "id": "zai-org/glm-4.6", + "name": "GLM-4.6", + "display_name": "GLM-4.6", "modalities": { "input": [ "text" @@ -13660,30 +13374,27 @@ ] }, "limit": { - "context": 131072, + "context": 128000, "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-07", - "release_date": "2024-08-01", - "last_updated": "2025-10-04", + "open_weights": true, + "release_date": "2025-03-01", + "last_updated": "2025-03-01", "cost": { - "input": 1, - "output": 3 - }, - "type": "chat" + "input": 0.6, + "output": 2.2 + } }, { - "id": "moonshotai/kimi-k2-instruct", - "name": "Kimi K2 Instruct", - "display_name": "Kimi K2 Instruct", + "id": "deepseek-ai/DeepSeek-R1", + "name": "DeepSeek R1", + "display_name": "DeepSeek R1", "modalities": { "input": [ "text" @@ -13693,7 +13404,7 @@ ] }, "limit": { - "context": 131072, + "context": 128000, "output": 8192 }, "temperature": true, @@ -13703,20 +13414,18 @@ "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2024-01", - "release_date": "2025-01-01", - "last_updated": "2025-10-04", + "open_weights": true, + "release_date": "2025-01-20", + "last_updated": "2025-01-20", "cost": { - "input": 0.5, - "output": 2.4 - }, - "type": "chat" + "input": 3, + "output": 7 + } }, { - "id": "nvidia/llama-3_1-nemotron-ultra-253b-v1", - "name": "Llama 3.1 Nemotron Ultra 253B v1", - "display_name": "Llama 3.1 Nemotron Ultra 253B v1", + "id": "deepseek-ai/DeepSeek-V3.1-Terminus", + "name": "DeepSeek V3.1 Terminus", + "display_name": "DeepSeek V3.1 Terminus", "modalities": { "input": [ "text" @@ -13726,7 +13435,7 @@ ] }, "limit": { - "context": 131072, + "context": 128000, "output": 8192 }, "temperature": true, @@ -13736,20 +13445,18 @@ "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2024-07", - "release_date": "2024-07-01", - "last_updated": "2025-10-04", + "open_weights": true, + "release_date": "2025-06-01", + "last_updated": "2025-06-01", "cost": { - "input": 0.6, - "output": 1.8 - }, - "type": "chat" + "input": 0.27, + "output": 1 + } }, { - "id": "openai/gpt-oss-20b", - "name": "GPT OSS 20B", - "display_name": "GPT OSS 20B", + "id": "deepseek-ai/DeepSeek-V3.2", + "name": "DeepSeek V3.2", + "display_name": "DeepSeek V3.2", "modalities": { "input": [ "text" @@ -13759,7 +13466,7 @@ ] }, "limit": { - "context": 131072, + "context": 128000, "output": 8192 }, "temperature": true, @@ -13768,21 +13475,27 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-01", - "release_date": "2024-01-01", - "last_updated": "2025-10-04", + "attachment": false, + "open_weights": true, + "release_date": "2025-06-15", + "last_updated": "2025-06-15", "cost": { - "input": 0.05, - "output": 0.2 - }, - "type": "chat" - }, + "input": 0.27, + "output": 0.4 + } + } + ] + }, + "vercel": { + "id": "vercel", + "name": "Vercel AI Gateway", + "display_name": "Vercel AI Gateway", + "doc": "https://github.com/vercel/ai/tree/5eb85cc45a259553501f535b8ac79a77d0e79223/packages/gateway", + "models": [ { - "id": "openai/gpt-oss-120b", - "name": "GPT OSS 120B", - "display_name": "GPT OSS 120B", + "id": "moonshotai/kimi-k2-thinking-turbo", + "name": "Kimi K2 Thinking Turbo", + "display_name": "Kimi K2 Thinking Turbo", "modalities": { "input": [ "text" @@ -13792,8 +13505,8 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 262114, + "output": 262114 }, "temperature": true, "tool_call": true, @@ -13801,21 +13514,21 @@ "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-01", - "release_date": "2024-01-01", - "last_updated": "2025-10-04", + "knowledge": "2024-08", + "release_date": "2025-11-06", + "last_updated": "2025-11-06", "cost": { - "input": 0.15, - "output": 0.6 - }, - "type": "chat" + "input": 1.15, + "output": 8, + "cache_read": 0.15 + } }, { - "id": "qwen/qwen3-235b-a22b-instruct-2507", - "name": "Qwen3 235B A22B Instruct 2507", - "display_name": "Qwen3 235B A22B Instruct 2507", + "id": "moonshotai/kimi-k2-turbo", + "name": "Kimi K2 Turbo", + "display_name": "Kimi K2 Turbo", "modalities": { "input": [ "text" @@ -13825,33 +13538,33 @@ ] }, "limit": { - "context": 262144, - "output": 8192 + "context": 256000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-07-25", - "last_updated": "2025-10-04", + "knowledge": "2024-08", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", "cost": { - "input": 0.2, - "output": 0.6 - }, - "type": "chat" + "input": 2.4, + "output": 10 + } }, { - "id": "qwen/qwen3-235b-a22b-thinking-2507", - "name": "Qwen3 235B A22B Thinking 2507", - "display_name": "Qwen3 235B A22B Thinking 2507", + "id": "moonshotai/kimi-k2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" @@ -13859,7 +13572,7 @@ }, "limit": { "context": 262144, - "output": 8192 + "output": 262144 }, "temperature": true, "tool_call": true, @@ -13867,21 +13580,20 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-07-25", - "last_updated": "2025-10-04", + "attachment": true, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-01-26", + "last_updated": "2026-01-26", "cost": { - "input": 0.2, - "output": 0.8 - }, - "type": "chat" + "input": 0.6, + "output": 1.2 + } }, { - "id": "qwen/qwen3-coder-480b-a35b-instruct", - "name": "Qwen3 Coder 480B A35B Instruct", - "display_name": "Qwen3 Coder 480B A35B Instruct", + "id": "moonshotai/kimi-k2-0905", + "name": "Kimi K2 0905", + "display_name": "Kimi K2 0905", "modalities": { "input": [ "text" @@ -13891,29 +13603,28 @@ ] }, "limit": { - "context": 262144, - "output": 66536 + "context": 131072, + "output": 16384 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-07-23", - "last_updated": "2025-10-04", + "knowledge": "2024-10", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", "cost": { - "input": 0.4, - "output": 1.8 - }, - "type": "chat" + "input": 0.6, + "output": 2.5 + } }, { - "id": "meta-llama/llama-3_1-405b-instruct", - "name": "Llama 3.1 405B Instruct", - "display_name": "Llama 3.1 405B Instruct", + "id": "moonshotai/kimi-k2-thinking", + "name": "Kimi K2 Thinking", + "display_name": "Kimi K2 Thinking", "modalities": { "input": [ "text" @@ -13923,8 +13634,8 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 216144, + "output": 216144 }, "temperature": true, "tool_call": true, @@ -13934,19 +13645,19 @@ }, "attachment": false, "open_weights": false, - "knowledge": "2024-03", - "release_date": "2024-07-23", - "last_updated": "2025-10-04", + "knowledge": "2024-08", + "release_date": "2025-11-06", + "last_updated": "2025-11-06", "cost": { - "input": 1, - "output": 3 - }, - "type": "chat" + "input": 0.47, + "output": 2, + "cache_read": 0.14 + } }, { - "id": "meta-llama/llama-3.3-70b-instruct-fast", - "name": "Llama-3.3-70B-Instruct (Fast)", - "display_name": "Llama-3.3-70B-Instruct (Fast)", + "id": "moonshotai/kimi-k2", + "name": "Kimi K2 Instruct", + "display_name": "Kimi K2 Instruct", "modalities": { "input": [ "text" @@ -13957,29 +13668,27 @@ }, "limit": { "context": 131072, - "output": 8192 + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-08", - "release_date": "2024-08-22", - "last_updated": "2025-10-04", + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2025-07-14", + "last_updated": "2025-07-14", "cost": { - "input": 0.25, - "output": 0.75 - }, - "type": "chat" + "input": 1, + "output": 3 + } }, { - "id": "meta-llama/llama-3.3-70b-instruct-base", - "name": "Llama-3.3-70B-Instruct (Base)", - "display_name": "Llama-3.3-70B-Instruct (Base)", + "id": "xiaomi/mimo-v2-flash", + "name": "MiMo V2 Flash", + "display_name": "MiMo V2 Flash", "modalities": { "input": [ "text" @@ -13989,8 +13698,8 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 262144, + "output": 32000 }, "temperature": true, "tool_call": true, @@ -14000,19 +13709,18 @@ }, "attachment": false, "open_weights": false, - "knowledge": "2024-08", - "release_date": "2024-08-22", - "last_updated": "2025-10-04", + "knowledge": "2024-10", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", "cost": { - "input": 0.13, - "output": 0.4 - }, - "type": "chat" + "input": 0.1, + "output": 0.29 + } }, { - "id": "zai-org/glm-4.5", - "name": "GLM 4.5", - "display_name": "GLM 4.5", + "id": "alibaba/qwen3-coder", + "name": "Qwen3 Coder 480B A35B Instruct", + "display_name": "Qwen3 Coder 480B A35B Instruct", "modalities": { "input": [ "text" @@ -14022,30 +13730,28 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 262144, + "output": 66536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2024-05", - "release_date": "2024-06-01", - "last_updated": "2025-10-04", + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "cost": { - "input": 0.6, - "output": 2.2 - }, - "type": "chat" + "input": 0.38, + "output": 1.53 + } }, { - "id": "zai-org/glm-4.5-air", - "name": "GLM 4.5 Air", - "display_name": "GLM 4.5 Air", + "id": "alibaba/qwen3-next-80b-a3b-instruct", + "name": "Qwen3 Next 80B A3B Instruct", + "display_name": "Qwen3 Next 80B A3B Instruct", "modalities": { "input": [ "text" @@ -14055,30 +13761,28 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 262144, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-05", - "release_date": "2024-06-01", - "last_updated": "2025-10-04", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-09-12", + "last_updated": "2025-09-12", "cost": { - "input": 0.2, - "output": 1.2 - }, - "type": "chat" + "input": 0.09, + "output": 1.1 + } }, { - "id": "deepseek-ai/deepseek-v3", - "name": "DeepSeek V3", - "display_name": "DeepSeek V3", + "id": "alibaba/qwen-3-32b", + "name": "Qwen 3.32B", + "display_name": "Qwen 3.32B", "modalities": { "input": [ "text" @@ -14088,8 +13792,8 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 40960, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -14099,39 +13803,30 @@ }, "attachment": false, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-05-07", - "last_updated": "2025-10-04", + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "cost": { - "input": 0.5, - "output": 1.5 - }, - "type": "chat" - } - ] - }, - "deepseek": { - "id": "deepseek", - "name": "DeepSeek", - "display_name": "DeepSeek", - "api": "https://api.deepseek.com", - "doc": "https://platform.deepseek.com/api-docs/pricing", - "models": [ + "input": 0.1, + "output": 0.3 + } + }, { - "id": "deepseek-chat", - "name": "DeepSeek Chat", - "display_name": "DeepSeek Chat", + "id": "alibaba/qwen3-vl-instruct", + "name": "Qwen3 VL Instruct", + "display_name": "Qwen3 VL Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 131072, + "output": 129024 }, "temperature": true, "tool_call": true, @@ -14139,21 +13834,19 @@ "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2024-07", - "release_date": "2024-12-26", - "last_updated": "2025-08-21", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-09-24", + "last_updated": "2025-09-24", "cost": { - "input": 0.57, - "output": 1.68, - "cache_read": 0.07 - }, - "type": "chat" + "input": 0.7, + "output": 2.8 + } }, { - "id": "deepseek-reasoner", - "name": "DeepSeek Reasoner", - "display_name": "DeepSeek Reasoner", + "id": "alibaba/qwen-3-235b", + "name": "Qwen3 235B A22B Instruct 2507", + "display_name": "Qwen3 235B A22B Instruct 2507", "modalities": { "input": [ "text" @@ -14163,40 +13856,28 @@ ] }, "limit": { - "context": 128000, - "output": 64000 + "context": 40960, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-07", - "release_date": "2025-01-20", - "last_updated": "2025-08-21", + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "cost": { - "input": 0.57, - "output": 1.68, - "cache_read": 0.07 - }, - "type": "chat" - } - ] - }, - "alibaba-cn": { - "id": "alibaba-cn", - "name": "alibaba-cn", - "display_name": "alibaba-cn", - "api": "https://dashscope.aliyuncs.com/compatible-mode/v1", - "doc": "https://www.alibabacloud.com/help/en/model-studio/models", - "models": [ + "input": 0.13, + "output": 0.6 + } + }, { - "id": "deepseek-r1-distill-qwen-7b", - "name": "DeepSeek R1 Distill Qwen 7B", - "display_name": "DeepSeek R1 Distill Qwen 7B", + "id": "alibaba/qwen-3-14b", + "name": "Qwen3-14B", + "display_name": "Qwen3-14B", "modalities": { "input": [ "text" @@ -14206,7 +13887,7 @@ ] }, "limit": { - "context": 32768, + "context": 40960, "output": 16384 }, "temperature": true, @@ -14217,29 +13898,29 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "cost": { - "input": 0.072, - "output": 0.144 - }, - "type": "chat" + "input": 0.06, + "output": 0.24 + } }, { - "id": "qwen3-asr-flash", - "name": "Qwen3-ASR Flash", - "display_name": "Qwen3-ASR Flash", + "id": "alibaba/qwen3-embedding-4b", + "name": "Qwen3 Embedding 4B", + "display_name": "Qwen3 Embedding 4B", "modalities": { "input": [ - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 53248, - "output": 4096 + "context": 32768, + "output": 32768 }, "temperature": false, "tool_call": false, @@ -14248,19 +13929,17 @@ }, "attachment": false, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-09-08", - "last_updated": "2025-09-08", + "release_date": "2025-06-05", + "last_updated": "2025-06-05", "cost": { - "input": 0.032, - "output": 0.032 - }, - "type": "chat" + "input": 0.02, + "output": 0 + } }, { - "id": "deepseek-r1-0528", - "name": "DeepSeek R1 0528", - "display_name": "DeepSeek R1 0528", + "id": "alibaba/qwen3-max-thinking", + "name": "Qwen 3 Max Thinking", + "display_name": "Qwen 3 Max Thinking", "modalities": { "input": [ "text" @@ -14270,8 +13949,8 @@ ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 256000, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -14280,19 +13959,54 @@ "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2025-05-28", - "last_updated": "2025-05-28", + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2025-01", + "last_updated": "2025-01", "cost": { - "input": 0.574, - "output": 2.294 + "input": 1.2, + "output": 6, + "cache_read": 0.24 + } + }, + { + "id": "alibaba/qwen3-235b-a22b-thinking", + "name": "Qwen3 235B A22B Thinking 2507", + "display_name": "Qwen3 235B A22B Thinking 2507", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] }, - "type": "chat" + "limit": { + "context": 262114, + "output": 262114 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", + "cost": { + "input": 0.3, + "output": 2.9 + } }, { - "id": "deepseek-v3", - "name": "DeepSeek V3", - "display_name": "DeepSeek V3", + "id": "alibaba/qwen-3-30b", + "name": "Qwen3-30B-A3B", + "display_name": "Qwen3-30B-A3B", "modalities": { "input": [ "text" @@ -14302,66 +14016,59 @@ ] }, "limit": { - "context": 65536, - "output": 8192 + "context": 40960, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "cost": { - "input": 0.287, - "output": 1.147 - }, - "type": "chat" + "input": 0.08, + "output": 0.29 + } }, { - "id": "qwen-omni-turbo", - "name": "Qwen-Omni Turbo", - "display_name": "Qwen-Omni Turbo", + "id": "alibaba/qwen3-embedding-0.6b", + "name": "Qwen3 Embedding 0.6B", + "display_name": "Qwen3 Embedding 0.6B", "modalities": { "input": [ - "text", - "image", - "audio", - "video" + "text" ], "output": [ - "text", - "audio" + "text" ] }, "limit": { "context": 32768, - "output": 2048 + "output": 32768 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-01-19", - "last_updated": "2025-03-26", + "release_date": "2025-11-14", + "last_updated": "2025-11-14", "cost": { - "input": 0.058, - "output": 0.23, - "input_audio": 3.584, - "output_audio": 7.168 - }, - "type": "chat" + "input": 0.01, + "output": 0 + } }, { - "id": "qwen-vl-max", - "name": "Qwen-VL Max", - "display_name": "Qwen-VL Max", + "id": "alibaba/qwen3-vl-thinking", + "name": "Qwen3 VL Thinking", + "display_name": "Qwen3 VL Thinking", "modalities": { "input": [ "text", @@ -14373,28 +14080,28 @@ }, "limit": { "context": 131072, - "output": 8192 + "output": 129024 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-04-08", - "last_updated": "2025-08-13", + "attachment": true, + "open_weights": true, + "knowledge": "2025-09", + "release_date": "2025-09-24", + "last_updated": "2025-09-24", "cost": { - "input": 0.23, - "output": 0.574 - }, - "type": "chat" + "input": 0.7, + "output": 8.4 + } }, { - "id": "deepseek-v3-2-exp", - "name": "DeepSeek V3.2 Exp", - "display_name": "DeepSeek V3.2 Exp", + "id": "alibaba/qwen3-max", + "name": "Qwen3 Max", + "display_name": "Qwen3 Max", "modalities": { "input": [ "text" @@ -14404,8 +14111,8 @@ ] }, "limit": { - "context": 131072, - "output": 65536 + "context": 262144, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -14414,18 +14121,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "knowledge": "2025-04", + "release_date": "2025-09-23", + "last_updated": "2025-09-23", "cost": { - "input": 0.287, - "output": 0.431 - }, - "type": "chat" + "input": 1.2, + "output": 6 + } }, { - "id": "qwen3-next-80b-a3b-instruct", - "name": "Qwen3 Next 80B A3B Instruct", - "display_name": "Qwen3 Next 80B A3B Instruct", + "id": "alibaba/qwen3-embedding-8b", + "name": "Qwen3 Embedding 8B", + "display_name": "Qwen3 Embedding 8B", "modalities": { "input": [ "text" @@ -14435,29 +14142,27 @@ ] }, "limit": { - "context": 131072, + "context": 32768, "output": 32768 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-09", - "last_updated": "2025-09", + "open_weights": false, + "release_date": "2025-06-05", + "last_updated": "2025-06-05", "cost": { - "input": 0.144, - "output": 0.574 - }, - "type": "chat" + "input": 0.05, + "output": 0 + } }, { - "id": "deepseek-r1", - "name": "DeepSeek R1", - "display_name": "DeepSeek R1", + "id": "alibaba/qwen3-max-preview", + "name": "Qwen3 Max Preview", + "display_name": "Qwen3 Max Preview", "modalities": { "input": [ "text" @@ -14467,29 +14172,29 @@ ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 262144, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "knowledge": "2025-04", + "release_date": "2025-09-23", + "last_updated": "2025-09-23", "cost": { - "input": 0.574, - "output": 2.294 - }, - "type": "chat" + "input": 1.2, + "output": 6, + "cache_read": 0.24 + } }, { - "id": "qwen-turbo", - "name": "Qwen Turbo", - "display_name": "Qwen Turbo", + "id": "alibaba/qwen3-coder-plus", + "name": "Qwen3 Coder Plus", + "display_name": "Qwen3 Coder Plus", "modalities": { "input": [ "text" @@ -14499,46 +14204,31 @@ ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 1000000, + "output": 1000000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false, - "budget": { - "default": 38912, - "min": 0, - "max": 38912 - } - }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" + "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-11-01", - "last_updated": "2025-07-15", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", "cost": { - "input": 0.044, - "output": 0.087, - "reasoning": 0.431 - }, - "type": "chat" + "input": 1, + "output": 5 + } }, { - "id": "qwen3-vl-235b-a22b", - "name": "Qwen3-VL 235B-A22B", - "display_name": "Qwen3-VL 235B-A22B", + "id": "alibaba/qwen3-next-80b-a3b-thinking", + "name": "Qwen3 Next 80B A3B Thinking", + "display_name": "Qwen3 Next 80B A3B Thinking", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -14546,7 +14236,7 @@ }, "limit": { "context": 131072, - "output": 32768 + "output": 65536 }, "temperature": true, "tool_call": true, @@ -14556,20 +14246,18 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2025-04", + "knowledge": "2025-09", + "release_date": "2025-09-12", + "last_updated": "2025-09-12", "cost": { - "input": 0.286705, - "output": 1.14682, - "reasoning": 2.867051 - }, - "type": "chat" + "input": 0.15, + "output": 1.5 + } }, { - "id": "qwen3-coder-flash", - "name": "Qwen3 Coder Flash", - "display_name": "Qwen3 Coder Flash", + "id": "alibaba/qwen3-coder-30b-a3b", + "name": "Qwen 3 Coder 30B A3B Instruct", + "display_name": "Qwen 3 Coder 30B A3B Instruct", "modalities": { "input": [ "text" @@ -14579,41 +14267,40 @@ ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 160000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, "knowledge": "2025-04", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "release_date": "2025-04", + "last_updated": "2025-04", "cost": { - "input": 0.144, - "output": 0.574 - }, - "type": "chat" + "input": 0.07, + "output": 0.27 + } }, { - "id": "qwen3-vl-30b-a3b", - "name": "Qwen3-VL 30B-A3B", - "display_name": "Qwen3-VL 30B-A3B", + "id": "meituan/longcat-flash-thinking", + "name": "LongCat Flash Thinking", + "display_name": "LongCat Flash Thinking", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -14622,21 +14309,19 @@ "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2025-04", + "open_weights": false, + "knowledge": "2024-10", + "release_date": "2025-09-23", + "last_updated": "2025-09-23", "cost": { - "input": 0.108, - "output": 0.431, - "reasoning": 1.076 - }, - "type": "chat" + "input": 0.15, + "output": 1.5 + } }, { - "id": "qwen3-14b", - "name": "Qwen3 14B", - "display_name": "Qwen3 14B", + "id": "meituan/longcat-flash-chat", + "name": "LongCat Flash Chat", + "display_name": "LongCat Flash Chat", "modalities": { "input": [ "text" @@ -14646,48 +14331,35 @@ ] }, "limit": { - "context": 131072, + "context": 128000, "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true, - "budget": { - "default": 38912, - "min": 0, - "max": 38912 - } + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2025-04", - "cost": { - "input": 0.144, - "output": 0.574, - "reasoning": 1.434 - }, - "type": "chat" + "open_weights": false, + "knowledge": "2024-10", + "release_date": "2025-08-30", + "last_updated": "2025-08-30" }, { - "id": "qvq-max", - "name": "QVQ Max", - "display_name": "QVQ Max", + "id": "xai/grok-4-fast-reasoning", + "name": "Grok 4 Fast Reasoning", + "display_name": "Grok 4 Fast Reasoning", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 2000000, + "output": 256000 }, "temperature": true, "tool_call": true, @@ -14697,19 +14369,19 @@ }, "attachment": false, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-03-25", - "last_updated": "2025-03-25", + "knowledge": "2024-10", + "release_date": "2025-07-09", + "last_updated": "2025-07-09", "cost": { - "input": 1.147, - "output": 4.588 - }, - "type": "chat" + "input": 0.2, + "output": 0.5, + "cache_read": 0.05 + } }, { - "id": "deepseek-r1-distill-qwen-32b", - "name": "DeepSeek R1 Distill Qwen 32B", - "display_name": "DeepSeek R1 Distill Qwen 32B", + "id": "xai/grok-4.1-fast-reasoning", + "name": "Grok 4.1 Fast Reasoning", + "display_name": "Grok 4.1 Fast Reasoning", "modalities": { "input": [ "text" @@ -14719,8 +14391,8 @@ ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 2000000, + "output": 30000 }, "temperature": true, "tool_call": true, @@ -14730,18 +14402,19 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "knowledge": "2024-10", + "release_date": "2025-07-09", + "last_updated": "2025-07-09", "cost": { - "input": 0.287, - "output": 0.861 - }, - "type": "chat" + "input": 0.2, + "output": 0.5, + "cache_read": 0.05 + } }, { - "id": "qwen-plus-character", - "name": "Qwen Plus Character", - "display_name": "Qwen Plus Character", + "id": "xai/grok-4.1-fast-non-reasoning", + "name": "Grok 4.1 Fast Non-Reasoning", + "display_name": "Grok 4.1 Fast Non-Reasoning", "modalities": { "input": [ "text" @@ -14751,8 +14424,8 @@ ] }, "limit": { - "context": 32768, - "output": 4096 + "context": 2000000, + "output": 30000 }, "temperature": true, "tool_call": true, @@ -14761,19 +14434,19 @@ }, "attachment": false, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-01", - "last_updated": "2024-01", + "knowledge": "2024-10", + "release_date": "2025-07-09", + "last_updated": "2025-07-09", "cost": { - "input": 0.115, - "output": 0.287 - }, - "type": "chat" + "input": 0.2, + "output": 0.5, + "cache_read": 0.05 + } }, { - "id": "qwen2-5-14b-instruct", - "name": "Qwen2.5 14B Instruct", - "display_name": "Qwen2.5 14B Instruct", + "id": "xai/grok-3-mini-fast", + "name": "Grok 3 Mini Fast", + "display_name": "Grok 3 Mini Fast", "modalities": { "input": [ "text" @@ -14789,23 +14462,25 @@ "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2024-04", - "release_date": "2024-09", - "last_updated": "2024-09", + "open_weights": false, + "knowledge": "2024-11", + "release_date": "2025-02-17", + "last_updated": "2025-02-17", "cost": { - "input": 0.144, - "output": 0.431 - }, - "type": "chat" + "input": 0.6, + "output": 4, + "reasoning": 4, + "cache_read": 0.15 + } }, { - "id": "qwq-plus", - "name": "QwQ Plus", - "display_name": "QwQ Plus", + "id": "xai/grok-3-mini", + "name": "Grok 3 Mini", + "display_name": "Grok 3 Mini", "modalities": { "input": [ "text" @@ -14819,37 +14494,27 @@ "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, - "default": true, - "budget": { - "default": 32768, - "min": 0, - "max": 32768 - } - }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" + "default": true }, "attachment": false, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-03-05", - "last_updated": "2025-03-05", + "knowledge": "2024-11", + "release_date": "2025-02-17", + "last_updated": "2025-02-17", "cost": { - "input": 0.23, - "output": 0.574 - }, - "type": "chat" + "input": 0.3, + "output": 0.5, + "reasoning": 0.5, + "cache_read": 0.075 + } }, { - "id": "qwen2-5-coder-32b-instruct", - "name": "Qwen2.5-Coder 32B Instruct", - "display_name": "Qwen2.5-Coder 32B Instruct", + "id": "xai/grok-3", + "name": "Grok 3", + "display_name": "Grok 3", "modalities": { "input": [ "text" @@ -14868,20 +14533,20 @@ "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-04", - "release_date": "2024-11", - "last_updated": "2024-11", + "open_weights": false, + "knowledge": "2024-11", + "release_date": "2025-02-17", + "last_updated": "2025-02-17", "cost": { - "input": 0.287, - "output": 0.861 - }, - "type": "chat" + "input": 3, + "output": 15, + "cache_read": 0.75 + } }, { - "id": "qwen3-coder-30b-a3b-instruct", - "name": "Qwen3-Coder 30B-A3B Instruct", - "display_name": "Qwen3-Coder 30B-A3B Instruct", + "id": "xai/grok-code-fast-1", + "name": "Grok Code Fast 1", + "display_name": "Grok Code Fast 1", "modalities": { "input": [ "text" @@ -14891,94 +14556,97 @@ ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 256000, + "output": 10000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2025-04", + "open_weights": false, + "knowledge": "2023-10", + "release_date": "2025-08-28", + "last_updated": "2025-08-28", "cost": { - "input": 0.216, - "output": 0.861 - }, - "type": "chat" + "input": 0.2, + "output": 1.5, + "cache_read": 0.02 + } }, { - "id": "qwen-math-plus", - "name": "Qwen Math Plus", - "display_name": "Qwen Math Plus", + "id": "xai/grok-2-vision", + "name": "Grok 2 Vision", + "display_name": "Grok 2 Vision", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 4096, - "output": 3072 + "context": 8192, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-08-16", - "last_updated": "2024-09-19", + "knowledge": "2024-08", + "release_date": "2024-08-20", + "last_updated": "2024-08-20", "cost": { - "input": 0.574, - "output": 1.721 - }, - "type": "chat" + "input": 2, + "output": 10, + "cache_read": 2 + } }, { - "id": "qwen-vl-ocr", - "name": "Qwen Vl Ocr", - "display_name": "Qwen Vl Ocr", + "id": "xai/grok-4", + "name": "Grok 4", + "display_name": "Grok 4", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 34096, - "output": 4096 + "context": 256000, + "output": 64000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-10-28", - "last_updated": "2025-04-13", + "knowledge": "2025-07", + "release_date": "2025-07-09", + "last_updated": "2025-07-09", "cost": { - "input": 0.717, - "output": 0.717 - }, - "type": "chat" + "input": 3, + "output": 15, + "reasoning": 15, + "cache_read": 0.75 + } }, { - "id": "qwen-doc-turbo", - "name": "Qwen Doc Turbo", - "display_name": "Qwen Doc Turbo", + "id": "xai/grok-3-fast", + "name": "Grok 3 Fast", + "display_name": "Grok 3 Fast", "modalities": { "input": [ "text" @@ -14998,51 +14666,52 @@ }, "attachment": false, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-01", - "last_updated": "2024-01", + "knowledge": "2024-11", + "release_date": "2025-02-17", + "last_updated": "2025-02-17", "cost": { - "input": 0.087, - "output": 0.144 - }, - "type": "chat" + "input": 5, + "output": 25, + "cache_read": 1.25 + } }, { - "id": "qwen-deep-research", - "name": "Qwen Deep Research", - "display_name": "Qwen Deep Research", + "id": "xai/grok-4-fast-non-reasoning", + "name": "Grok 4 Fast (Non-Reasoning)", + "display_name": "Grok 4 Fast (Non-Reasoning)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 32768 + "context": 2000000, + "output": 30000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-01", - "last_updated": "2024-01", + "knowledge": "2025-07", + "release_date": "2025-09-19", + "last_updated": "2025-09-19", "cost": { - "input": 7.742, - "output": 23.367 - }, - "type": "chat" + "input": 0.2, + "output": 0.5, + "cache_read": 0.05 + } }, { - "id": "qwen2-5-72b-instruct", - "name": "Qwen2.5 72B Instruct", - "display_name": "Qwen2.5 72B Instruct", + "id": "nvidia/nemotron-nano-9b-v2", + "name": "Nvidia Nemotron Nano 9B V2", + "display_name": "Nvidia Nemotron Nano 9B V2", "modalities": { "input": [ "text" @@ -15053,43 +14722,40 @@ }, "limit": { "context": 131072, - "output": 8192 + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2024-04", - "release_date": "2024-09", - "last_updated": "2024-09", + "open_weights": false, + "knowledge": "2024-10", + "release_date": "2025-08-18", + "last_updated": "2025-08-18", "cost": { - "input": 0.574, - "output": 1.721 - }, - "type": "chat" + "input": 0.04, + "output": 0.16 + } }, { - "id": "qwen3-omni-flash", - "name": "Qwen3-Omni Flash", - "display_name": "Qwen3-Omni Flash", + "id": "nvidia/nemotron-nano-12b-v2-vl", + "name": "Nvidia Nemotron Nano 12B V2 VL", + "display_name": "Nvidia Nemotron Nano 12B V2 VL", "modalities": { "input": [ "text", - "image", - "audio", - "video" + "image" ], "output": [ - "text", - "audio" + "text" ] }, "limit": { - "context": 65536, - "output": 16384 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -15097,23 +14763,20 @@ "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-09-15", - "last_updated": "2025-09-15", + "knowledge": "2024-10", + "release_date": "2024-12", + "last_updated": "2024-12", "cost": { - "input": 0.058, - "output": 0.23, - "input_audio": 3.584, - "output_audio": 7.168 - }, - "type": "chat" + "input": 0.2, + "output": 0.6 + } }, { - "id": "qwen-flash", - "name": "Qwen Flash", - "display_name": "Qwen Flash", + "id": "nvidia/nemotron-3-nano-30b-a3b", + "name": "Nemotron 3 Nano 30B A3B", + "display_name": "Nemotron 3 Nano 30B A3B", "modalities": { "input": [ "text" @@ -15123,41 +14786,29 @@ ] }, "limit": { - "context": 1000000, - "output": 32768 + "context": 262144, + "output": 262144 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, - "default": false, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } - }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" + "default": true }, "attachment": false, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "knowledge": "2024-10", + "release_date": "2024-12", + "last_updated": "2024-12", "cost": { - "input": 0.022, - "output": 0.216 - }, - "type": "chat" + "input": 0.06, + "output": 0.24 + } }, { - "id": "qwen3-8b", - "name": "Qwen3 8B", - "display_name": "Qwen3 8B", + "id": "cohere/embed-v4.0", + "name": "Embed v4.0", + "display_name": "Embed v4.0", "modalities": { "input": [ "text" @@ -15167,50 +14818,38 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 8192, + "output": 1536 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true, - "budget": { - "default": 38912, - "min": 0, - "max": 38912 - } + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2025-04", + "open_weights": false, + "release_date": "2025-04-15", + "last_updated": "2025-04-15", "cost": { - "input": 0.072, - "output": 0.287, - "reasoning": 0.717 - }, - "type": "chat" + "input": 0.12, + "output": 0 + } }, { - "id": "qwen3-omni-flash-realtime", - "name": "Qwen3-Omni Flash Realtime", - "display_name": "Qwen3-Omni Flash Realtime", + "id": "cohere/command-a", + "name": "Command A", + "display_name": "Command A", "modalities": { "input": [ - "text", - "image", - "audio" + "text" ], "output": [ - "text", - "audio" + "text" ] }, "limit": { - "context": 65536, - "output": 16384 + "context": 256000, + "output": 8000 }, "temperature": true, "tool_call": true, @@ -15219,54 +14858,46 @@ }, "attachment": false, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-09-15", - "last_updated": "2025-09-15", + "knowledge": "2024-10", + "release_date": "2025-03-13", + "last_updated": "2025-03-13", "cost": { - "input": 0.23, - "output": 0.918, - "input_audio": 3.584, - "output_audio": 7.168 - }, - "type": "chat" + "input": 2.5, + "output": 10 + } }, { - "id": "qwen2-5-vl-72b-instruct", - "name": "Qwen2.5-VL 72B Instruct", - "display_name": "Qwen2.5-VL 72B Instruct", + "id": "kwaipilot/kat-coder-pro-v1", + "name": "KAT-Coder-Pro V1", + "display_name": "KAT-Coder-Pro V1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 256000, + "output": 32000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2024-04", - "release_date": "2024-09", - "last_updated": "2024-09", - "cost": { - "input": 2.294, - "output": 6.881 - }, - "type": "chat" + "open_weights": false, + "knowledge": "2024-10", + "release_date": "2025-10-24", + "last_updated": "2025-10-24" }, { - "id": "qwen3-vl-plus", - "name": "Qwen3 VL Plus", - "display_name": "Qwen3 VL Plus", + "id": "mistral/mistral-medium", + "name": "Mistral Medium 3.1", + "display_name": "Mistral Medium 3.1", "modalities": { "input": [ "text", @@ -15277,36 +14908,28 @@ ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 128000, + "output": 64000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": false, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-09-23", - "last_updated": "2025-09-23", + "knowledge": "2024-10", + "release_date": "2025-05-07", + "last_updated": "2025-05-07", "cost": { - "input": 0.143353, - "output": 1.433525, - "reasoning": 4.300576 - }, - "type": "chat" + "input": 0.4, + "output": 2 + } }, { - "id": "qwen-plus", - "name": "Qwen Plus", - "display_name": "Qwen Plus", + "id": "mistral/codestral-embed", + "name": "Codestral Embed", + "display_name": "Codestral Embed", "modalities": { "input": [ "text" @@ -15316,42 +14939,27 @@ ] }, "limit": { - "context": 1000000, - "output": 32768 + "context": 8192, + "output": 1536 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": false, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } - }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-01-25", - "last_updated": "2025-09-11", + "release_date": "2025-05-28", + "last_updated": "2025-05-28", "cost": { - "input": 0.115, - "output": 0.287, - "reasoning": 1.147 - }, - "type": "chat" + "input": 0.15, + "output": 0 + } }, { - "id": "qwen2-5-32b-instruct", - "name": "Qwen2.5 32B Instruct", - "display_name": "Qwen2.5 32B Instruct", + "id": "mistral/devstral-2", + "name": "Devstral 2", + "display_name": "Devstral 2", "modalities": { "input": [ "text" @@ -15361,8 +14969,8 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 256000, + "output": 256000 }, "temperature": true, "tool_call": true, @@ -15370,35 +14978,26 @@ "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-04", - "release_date": "2024-09", - "last_updated": "2024-09", - "cost": { - "input": 0.287, - "output": 0.861 - }, - "type": "chat" + "open_weights": false, + "knowledge": "2024-10", + "release_date": "2025-12-09", + "last_updated": "2025-12-09" }, { - "id": "qwen2-5-omni-7b", - "name": "Qwen2.5-Omni 7B", - "display_name": "Qwen2.5-Omni 7B", + "id": "mistral/devstral-small", + "name": "Devstral Small 1.1", + "display_name": "Devstral Small 1.1", "modalities": { "input": [ - "text", - "image", - "audio", - "video" + "text" ], "output": [ - "text", - "audio" + "text" ] }, "limit": { - "context": 32768, - "output": 2048 + "context": 128000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -15406,59 +15005,51 @@ "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-04", - "release_date": "2024-12", - "last_updated": "2024-12", + "open_weights": false, + "knowledge": "2024-10", + "release_date": "2025-05-07", + "last_updated": "2025-05-07", "cost": { - "input": 0.087, - "output": 0.345, - "input_audio": 5.448 - }, - "type": "chat" + "input": 0.1, + "output": 0.3 + } }, { - "id": "qwen-max", - "name": "Qwen Max", - "display_name": "Qwen Max", + "id": "mistral/mistral-large-3", + "name": "Mistral Large 3", + "display_name": "Mistral Large 3", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 8192 + "context": 256000, + "output": 256000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" - }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-04-03", - "last_updated": "2025-01-25", + "knowledge": "2024-10", + "release_date": "2025-12-02", + "last_updated": "2025-12-02", "cost": { - "input": 0.345, - "output": 1.377 - }, - "type": "chat" + "input": 0.5, + "output": 1.5 + } }, { - "id": "qwen-long", - "name": "Qwen Long", - "display_name": "Qwen Long", + "id": "mistral/mistral-embed", + "name": "Mistral Embed", + "display_name": "Mistral Embed", "modalities": { "input": [ "text" @@ -15468,29 +15059,27 @@ ] }, "limit": { - "context": 1000000, - "output": 8192 + "context": 8192, + "output": 1536 }, - "temperature": true, + "temperature": false, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-01-25", - "last_updated": "2025-01-25", + "release_date": "2023-12-11", + "last_updated": "2023-12-11", "cost": { - "input": 0.072, - "output": 0.287 - }, - "type": "chat" + "input": 0.1, + "output": 0 + } }, { - "id": "qwen2-5-math-72b-instruct", - "name": "Qwen2.5-Math 72B Instruct", - "display_name": "Qwen2.5-Math 72B Instruct", + "id": "mistral/mistral-nemo", + "name": "Mistral Nemo", + "display_name": "Mistral Nemo", "modalities": { "input": [ "text" @@ -15500,8 +15089,8 @@ ] }, "limit": { - "context": 4096, - "output": 3072 + "context": 60288, + "output": 16000 }, "temperature": true, "tool_call": true, @@ -15509,51 +15098,52 @@ "supported": false }, "attachment": false, - "open_weights": true, + "open_weights": false, "knowledge": "2024-04", - "release_date": "2024-09", - "last_updated": "2024-09", + "release_date": "2024-07-01", + "last_updated": "2024-07-01", "cost": { - "input": 0.574, - "output": 1.721 - }, - "type": "chat" + "input": 0.04, + "output": 0.17 + } }, { - "id": "moonshot-kimi-k2-instruct", - "name": "Moonshot Kimi K2 Instruct", - "display_name": "Moonshot Kimi K2 Instruct", + "id": "mistral/ministral-14b", + "name": "Ministral 14B", + "display_name": "Ministral 14B", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 256000, + "output": 256000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "knowledge": "2024-10", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "cost": { - "input": 0.574, - "output": 2.294 - }, - "type": "chat" + "input": 0.2, + "output": 0.2 + } }, { - "id": "tongyi-intent-detect-v3", - "name": "Tongyi Intent Detect V3", - "display_name": "Tongyi Intent Detect V3", + "id": "mistral/devstral-small-2", + "name": "Devstral Small 2", + "display_name": "Devstral Small 2", "modalities": { "input": [ "text" @@ -15563,29 +15153,24 @@ ] }, "limit": { - "context": 8192, - "output": 1024 + "context": 256000, + "output": 256000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-01", - "last_updated": "2024-01", - "cost": { - "input": 0.058, - "output": 0.144 - }, - "type": "chat" + "knowledge": "2024-10", + "release_date": "2025-05-07", + "last_updated": "2025-05-07" }, { - "id": "qwen2-5-7b-instruct", - "name": "Qwen2.5 7B Instruct", - "display_name": "Qwen2.5 7B Instruct", + "id": "mistral/codestral", + "name": "Codestral", + "display_name": "Codestral", "modalities": { "input": [ "text" @@ -15595,8 +15180,8 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 256000, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -15605,83 +15190,82 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-04", - "release_date": "2024-09", - "last_updated": "2024-09", + "knowledge": "2024-10", + "release_date": "2024-05-29", + "last_updated": "2025-01-04", "cost": { - "input": 0.072, - "output": 0.144 - }, - "type": "chat" + "input": 0.3, + "output": 0.9 + } }, { - "id": "qwen2-5-vl-7b-instruct", - "name": "Qwen2.5-VL 7B Instruct", - "display_name": "Qwen2.5-VL 7B Instruct", + "id": "mistral/magistral-medium", + "name": "Magistral Medium", + "display_name": "Magistral Medium", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "knowledge": "2024-04", - "release_date": "2024-09", - "last_updated": "2024-09", + "knowledge": "2025-06", + "release_date": "2025-03-17", + "last_updated": "2025-03-20", "cost": { - "input": 0.287, - "output": 0.717 - }, - "type": "chat" + "input": 2, + "output": 5 + } }, { - "id": "deepseek-v3-1", - "name": "DeepSeek V3.1", - "display_name": "DeepSeek V3.1", + "id": "mistral/pixtral-large", + "name": "Pixtral Large", + "display_name": "Pixtral Large", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 65536 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "attachment": true, + "open_weights": true, + "knowledge": "2024-11", + "release_date": "2024-11-01", + "last_updated": "2024-11-04", "cost": { - "input": 0.574, - "output": 1.721 - }, - "type": "chat" + "input": 2, + "output": 6 + } }, { - "id": "deepseek-r1-distill-llama-70b", - "name": "DeepSeek R1 Distill Llama 70B", - "display_name": "DeepSeek R1 Distill Llama 70B", + "id": "mistral/ministral-8b", + "name": "Ministral 8B", + "display_name": "Ministral 8B", "modalities": { "input": [ "text" @@ -15691,29 +15275,28 @@ ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2024-10-01", + "last_updated": "2024-10-04", "cost": { - "input": 0.287, - "output": 0.861 - }, - "type": "chat" + "input": 0.1, + "output": 0.1 + } }, { - "id": "qwen3-235b-a22b", - "name": "Qwen3 235B A22B", - "display_name": "Qwen3 235B A22B", + "id": "mistral/ministral-3b", + "name": "Ministral 3B", + "display_name": "Ministral 3B", "modalities": { "input": [ "text" @@ -15723,36 +15306,28 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2025-04", + "knowledge": "2024-10", + "release_date": "2024-10-01", + "last_updated": "2024-10-04", "cost": { - "input": 0.287, - "output": 1.147, - "reasoning": 2.868 - }, - "type": "chat" + "input": 0.04, + "output": 0.04 + } }, { - "id": "qwen2-5-coder-7b-instruct", - "name": "Qwen2.5-Coder 7B Instruct", - "display_name": "Qwen2.5-Coder 7B Instruct", + "id": "mistral/magistral-small", + "name": "Magistral Small", + "display_name": "Magistral Small", "modalities": { "input": [ "text" @@ -15762,98 +15337,93 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "knowledge": "2024-04", - "release_date": "2024-11", - "last_updated": "2024-11", + "knowledge": "2025-06", + "release_date": "2025-03-17", + "last_updated": "2025-03-17", "cost": { - "input": 0.144, - "output": 0.287 - }, - "type": "chat" + "input": 0.5, + "output": 1.5 + } }, { - "id": "deepseek-r1-distill-qwen-14b", - "name": "DeepSeek R1 Distill Qwen 14B", - "display_name": "DeepSeek R1 Distill Qwen 14B", + "id": "mistral/mistral-small", + "name": "Mistral Small", + "display_name": "Mistral Small", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, + "context": 128000, "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "open_weights": true, + "knowledge": "2025-03", + "release_date": "2024-09-01", + "last_updated": "2024-09-04", "cost": { - "input": 0.144, - "output": 0.431 - }, - "type": "chat" + "input": 0.1, + "output": 0.3 + } }, { - "id": "qwen-omni-turbo-realtime", - "name": "Qwen-Omni Turbo Realtime", - "display_name": "Qwen-Omni Turbo Realtime", + "id": "mistral/pixtral-12b", + "name": "Pixtral 12B", + "display_name": "Pixtral 12B", "modalities": { "input": [ "text", - "image", - "audio" + "image" ], "output": [ - "text", - "audio" + "text" ] }, "limit": { - "context": 32768, - "output": 2048 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-05-08", - "last_updated": "2025-05-08", + "attachment": true, + "open_weights": true, + "knowledge": "2024-09", + "release_date": "2024-09-01", + "last_updated": "2024-09-01", "cost": { - "input": 0.23, - "output": 0.918, - "input_audio": 3.584, - "output_audio": 7.168 - }, - "type": "chat" + "input": 0.15, + "output": 0.15 + } }, { - "id": "qwen-math-turbo", - "name": "Qwen Math Turbo", - "display_name": "Qwen Math Turbo", + "id": "mistral/mixtral-8x22b-instruct", + "name": "Mixtral 8x22B", + "display_name": "Mixtral 8x22B", "modalities": { "input": [ "text" @@ -15863,8 +15433,8 @@ ] }, "limit": { - "context": 4096, - "output": 3072 + "context": 64000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -15872,63 +15442,63 @@ "supported": false }, "attachment": false, - "open_weights": false, + "open_weights": true, "knowledge": "2024-04", - "release_date": "2024-09-19", - "last_updated": "2024-09-19", + "release_date": "2024-04-17", + "last_updated": "2024-04-17", "cost": { - "input": 0.287, - "output": 0.861 - }, - "type": "chat" + "input": 2, + "output": 6 + } }, { - "id": "qwen-mt-turbo", - "name": "Qwen Mt Turbo", - "display_name": "Qwen Mt Turbo", + "id": "vercel/v0-1.0-md", + "name": "v0-1.0-md", + "display_name": "v0-1.0-md", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 16384, - "output": 8192 + "context": 128000, + "output": 32000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-01", - "last_updated": "2025-01", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 0.101, - "output": 0.28 - }, - "type": "chat" + "input": 3, + "output": 15 + } }, { - "id": "deepseek-r1-distill-llama-8b", - "name": "DeepSeek R1 Distill Llama 8B", - "display_name": "DeepSeek R1 Distill Llama 8B", + "id": "vercel/v0-1.5-md", + "name": "v0-1.5-md", + "display_name": "v0-1.5-md", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 128000, + "output": 32000 }, "temperature": true, "tool_call": true, @@ -15936,20 +15506,19 @@ "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "release_date": "2025-06-09", + "last_updated": "2025-06-09", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 3, + "output": 15 + } }, { - "id": "qwen3-coder-480b-a35b-instruct", - "name": "Qwen3-Coder 480B-A35B Instruct", - "display_name": "Qwen3-Coder 480B-A35B Instruct", + "id": "deepseek/deepseek-v3", + "name": "DeepSeek V3 0324", + "display_name": "DeepSeek V3 0324", "modalities": { "input": [ "text" @@ -15959,8 +15528,8 @@ ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 163840, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -15968,20 +15537,19 @@ "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2025-04", + "open_weights": false, + "knowledge": "2024-07", + "release_date": "2024-12-26", + "last_updated": "2024-12-26", "cost": { - "input": 0.861, - "output": 3.441 - }, - "type": "chat" + "input": 0.77, + "output": 0.77 + } }, { - "id": "qwen-mt-plus", - "name": "Qwen Mt Plus", - "display_name": "Qwen Mt Plus", + "id": "deepseek/deepseek-v3.2-thinking", + "name": "DeepSeek V3.2 Thinking", + "display_name": "DeepSeek V3.2 Thinking", "modalities": { "input": [ "text" @@ -15991,29 +15559,30 @@ ] }, "limit": { - "context": 16384, - "output": 8192 + "context": 128000, + "output": 64000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-01", - "last_updated": "2025-01", + "knowledge": "2024-07", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "cost": { - "input": 0.259, - "output": 0.775 - }, - "type": "chat" + "input": 0.28, + "output": 0.42, + "cache_read": 0.03 + } }, { - "id": "qwen3-max", - "name": "Qwen3 Max", - "display_name": "Qwen3 Max", + "id": "deepseek/deepseek-v3.1-terminus", + "name": "DeepSeek V3.1 Terminus", + "display_name": "DeepSeek V3.1 Terminus", "modalities": { "input": [ "text" @@ -16023,29 +15592,29 @@ ] }, "limit": { - "context": 262144, + "context": 131072, "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-09-23", - "last_updated": "2025-09-23", + "open_weights": true, + "knowledge": "2025-07", + "release_date": "2025-09-22", + "last_updated": "2025-09-22", "cost": { - "input": 0.861, - "output": 3.441 - }, - "type": "chat" + "input": 0.27, + "output": 1 + } }, { - "id": "qwq-32b", - "name": "QwQ 32B", - "display_name": "QwQ 32B", + "id": "deepseek/deepseek-v3.1", + "name": "DeepSeek-V3.1", + "display_name": "DeepSeek-V3.1", "modalities": { "input": [ "text" @@ -16055,8 +15624,8 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 163840, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -16065,20 +15634,19 @@ "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2024-04", - "release_date": "2024-12", - "last_updated": "2024-12", + "open_weights": false, + "knowledge": "2024-07", + "release_date": "2025-08-21", + "last_updated": "2025-08-21", "cost": { - "input": 0.287, - "output": 0.861 - }, - "type": "chat" + "input": 0.3, + "output": 1 + } }, { - "id": "qwen2-5-math-7b-instruct", - "name": "Qwen2.5-Math 7B Instruct", - "display_name": "Qwen2.5-Math 7B Instruct", + "id": "deepseek/deepseek-v3.2-exp", + "name": "DeepSeek V3.2 Exp", + "display_name": "DeepSeek V3.2 Exp", "modalities": { "input": [ "text" @@ -16088,29 +15656,29 @@ ] }, "limit": { - "context": 4096, - "output": 3072 + "context": 163840, + "output": 163840 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2024-04", - "release_date": "2024-09", - "last_updated": "2024-09", + "open_weights": false, + "knowledge": "2025-09", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 0.144, - "output": 0.287 - }, - "type": "chat" + "input": 0.27, + "output": 0.4 + } }, { - "id": "qwen3-next-80b-a3b-thinking", - "name": "Qwen3 Next 80B A3B Thinking", - "display_name": "Qwen3 Next 80B A3B Thinking", + "id": "deepseek/deepseek-v3.2", + "name": "DeepSeek V3.2", + "display_name": "DeepSeek V3.2", "modalities": { "input": [ "text" @@ -16120,35 +15688,29 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 163842, + "output": 8000 }, "temperature": true, "tool_call": false, "reasoning": { - "supported": true, - "default": true, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-09", - "last_updated": "2025-09", + "open_weights": false, + "knowledge": "2024-07", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "cost": { - "input": 0.144, - "output": 1.434 - }, - "type": "chat" + "input": 0.27, + "output": 0.4, + "cache_read": 0.22 + } }, { - "id": "deepseek-r1-distill-qwen-1-5b", - "name": "DeepSeek R1 Distill Qwen 1.5B", - "display_name": "DeepSeek R1 Distill Qwen 1.5B", + "id": "deepseek/deepseek-r1", + "name": "DeepSeek-R1", + "display_name": "DeepSeek-R1", "modalities": { "input": [ "text" @@ -16158,8 +15720,8 @@ ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -16169,226 +15731,200 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "knowledge": "2024-07", + "release_date": "2025-01-20", + "last_updated": "2025-05-29", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 1.35, + "output": 5.4 + } }, { - "id": "qwen3-32b", - "name": "Qwen3 32B", - "display_name": "Qwen3 32B", + "id": "recraft/recraft-v3", + "name": "Recraft V3", + "display_name": "Recraft V3", "modalities": { "input": [ "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 512, + "output": 0 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true, - "budget": { - "default": 38912, - "min": 0, - "max": 38912 - } + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2025-04", - "cost": { - "input": 0.287, - "output": 1.147, - "reasoning": 2.868 - }, - "type": "chat" + "open_weights": false, + "release_date": "2024-10", + "last_updated": "2024-10" }, { - "id": "qwen-vl-plus", - "name": "Qwen-VL Plus", - "display_name": "Qwen-VL Plus", + "id": "recraft/recraft-v2", + "name": "Recraft V2", + "display_name": "Recraft V2", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 512, + "output": 0 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-01-25", - "last_updated": "2025-08-15", - "cost": { - "input": 0.115, - "output": 0.287 - }, - "type": "chat" + "release_date": "2024-03", + "last_updated": "2024-03" }, { - "id": "qwen3-coder-plus", - "name": "Qwen3 Coder Plus", - "display_name": "Qwen3 Coder Plus", + "id": "bfl/flux-kontext-pro", + "name": "FLUX.1 Kontext Pro", + "display_name": "FLUX.1 Kontext Pro", "modalities": { "input": [ "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 512, + "output": 0 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-23", - "last_updated": "2025-07-23", - "cost": { - "input": 1, - "output": 5 - }, - "type": "chat" + "open_weights": false, + "release_date": "2025-06", + "last_updated": "2025-06" }, { - "id": "qwen3-coder-plus-2025-09-23", - "name": "Qwen3 Coder Plus 2025 09 23", - "display_name": "Qwen3 Coder Plus 2025 09 23", + "id": "bfl/flux-kontext-max", + "name": "FLUX.1 Kontext Max", + "display_name": "FLUX.1 Kontext Max", "modalities": { "input": [ "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 512, + "output": 0 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "type": "chat" + "open_weights": false, + "release_date": "2025-06", + "last_updated": "2025-06" }, { - "id": "qwen3-coder-plus-2025-07-22", - "name": "Qwen3 Coder Plus 2025 07 22", - "display_name": "Qwen3 Coder Plus 2025 07 22", + "id": "bfl/flux-pro-1.1", + "name": "FLUX1.1 [pro]", + "display_name": "FLUX1.1 [pro]", "modalities": { "input": [ "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 512, + "output": 0 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "type": "chat" + "open_weights": false, + "release_date": "2024-10", + "last_updated": "2024-10" }, { - "id": "qwen-vl-ocr-latest", - "name": "Qwen Vl Ocr Latest", - "display_name": "Qwen Vl Ocr Latest", + "id": "bfl/flux-pro-1.1-ultra", + "name": "FLUX1.1 [pro] Ultra", + "display_name": "FLUX1.1 [pro] Ultra", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 34096, - "output": 4096 + "context": 512, + "output": 0 }, - "temperature": true, + "temperature": false, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "type": "chat" + "open_weights": false, + "release_date": "2024-11", + "last_updated": "2024-11" }, { - "id": "qvq-max-2025-05-15", - "name": "Qvq Max 2025 05 15", - "display_name": "Qvq Max 2025 05 15", + "id": "bfl/flux-pro-1.0-fill", + "name": "FLUX.1 Fill [pro]", + "display_name": "FLUX.1 Fill [pro]", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 512, + "output": 0 }, - "temperature": true, + "temperature": false, "tool_call": false, "reasoning": { - "supported": true, - "default": false, - "budget": { - "default": 16384, - "min": 0, - "max": 16384 - } + "supported": false }, "attachment": false, - "type": "chat" + "open_weights": false, + "release_date": "2024-10", + "last_updated": "2024-10" }, { - "id": "qwen-turbo-latest", - "name": "Qwen Turbo Latest", - "display_name": "Qwen Turbo Latest", + "id": "arcee-ai/trinity-mini", + "name": "Trinity Mini", + "display_name": "Trinity Mini", "modalities": { "input": [ "text" @@ -16399,32 +15935,27 @@ }, "limit": { "context": 131072, - "output": 16384 + "output": 131072 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false, - "budget": { - "default": 38912, - "min": 0, - "max": 38912 - } - }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" + "supported": false }, "attachment": false, - "type": "chat" + "open_weights": false, + "knowledge": "2024-10", + "release_date": "2025-12", + "last_updated": "2025-12", + "cost": { + "input": 0.05, + "output": 0.15 + } }, { - "id": "qwen-turbo-2024-09-19", - "name": "Qwen Turbo 2024 09 19", - "display_name": "Qwen Turbo 2024 09 19", + "id": "arcee-ai/trinity-large-preview", + "name": "Trinity Large Preview", + "display_name": "Trinity Large Preview", "modalities": { "input": [ "text" @@ -16434,8 +15965,8 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 131000, + "output": 131000 }, "temperature": true, "tool_call": true, @@ -16443,12 +15974,19 @@ "supported": false }, "attachment": false, - "type": "chat" + "open_weights": false, + "knowledge": "2024-10", + "release_date": "2025-01", + "last_updated": "2025-01", + "cost": { + "input": 0.25, + "output": 1 + } }, { - "id": "qwen-flash-2025-07-28", - "name": "Qwen Flash 2025 07 28", - "display_name": "Qwen Flash 2025 07 28", + "id": "minimax/minimax-m2", + "name": "MiniMax M2", + "display_name": "MiniMax M2", "modalities": { "input": [ "text" @@ -16458,33 +15996,31 @@ ] }, "limit": { - "context": 1000000, - "output": 32768 + "context": 262114, + "output": 262114 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } - }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" + "default": true }, "attachment": false, - "type": "chat" + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2025-10-27", + "last_updated": "2025-10-27", + "cost": { + "input": 0.27, + "output": 1.15, + "cache_read": 0.03, + "cache_write": 0.38 + } }, { - "id": "qwen-plus-latest", - "name": "Qwen Plus Latest", - "display_name": "Qwen Plus Latest", + "id": "minimax/minimax-m2.1-lightning", + "name": "MiniMax M2.1 Lightning", + "display_name": "MiniMax M2.1 Lightning", "modalities": { "input": [ "text" @@ -16494,33 +16030,31 @@ ] }, "limit": { - "context": 1000000, - "output": 32768 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } - }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" + "default": true }, "attachment": false, - "type": "chat" + "open_weights": false, + "knowledge": "2024-10", + "release_date": "2025-10-27", + "last_updated": "2025-10-27", + "cost": { + "input": 0.3, + "output": 2.4, + "cache_read": 0.03, + "cache_write": 0.38 + } }, { - "id": "qwen-plus-2024-09-19", - "name": "Qwen Plus 2024 09 19", - "display_name": "Qwen Plus 2024 09 19", + "id": "minimax/minimax-m2.1", + "name": "MiniMax M2.1", + "display_name": "MiniMax M2.1", "modalities": { "input": [ "text" @@ -16530,21 +16064,31 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "type": "chat" + "open_weights": false, + "knowledge": "2024-10", + "release_date": "2025-10-27", + "last_updated": "2025-10-27", + "cost": { + "input": 0.3, + "output": 1.2, + "cache_read": 0.03, + "cache_write": 0.38 + } }, { - "id": "qwen-plus-2025-07-14", - "name": "Qwen Plus 2025 07 14", - "display_name": "Qwen Plus 2025 07 14", + "id": "bytedance/seed-1.6", + "name": "Seed 1.6", + "display_name": "Seed 1.6", "modalities": { "input": [ "text" @@ -16554,69 +16098,64 @@ ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 256000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false, - "budget": { - "default": 38912, - "min": 0, - "max": 38912 - } - }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" + "default": true }, "attachment": false, - "type": "chat" + "open_weights": false, + "knowledge": "2024-10", + "release_date": "2025-09", + "last_updated": "2025-09", + "cost": { + "input": 0.25, + "output": 2, + "cache_read": 0.05 + } }, { - "id": "qwen-plus-2025-09-11", - "name": "Qwen Plus 2025 09 11", - "display_name": "Qwen Plus 2025 09 11", + "id": "bytedance/seed-1.8", + "name": "Seed 1.8", + "display_name": "Seed 1.8", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 32768 + "context": 256000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } - }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" + "default": true }, "attachment": false, - "type": "chat" + "open_weights": false, + "knowledge": "2024-10", + "release_date": "2025-10", + "last_updated": "2025-10", + "cost": { + "input": 0.25, + "output": 2, + "cache_read": 0.05 + } }, { - "id": "qwen-max-latest", - "name": "Qwen Max Latest", - "display_name": "Qwen Max Latest", + "id": "voyage/voyage-code-2", + "name": "voyage-code-2", + "display_name": "voyage-code-2", "modalities": { "input": [ "text" @@ -16626,27 +16165,27 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 8192, + "output": 1536 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" - }, "attachment": false, - "type": "chat" + "open_weights": false, + "release_date": "2024-01", + "last_updated": "2024-01", + "cost": { + "input": 0.12, + "output": 0 + } }, { - "id": "qwen-max-2024-09-19", - "name": "Qwen Max 2024 09 19", - "display_name": "Qwen Max 2024 09 19", + "id": "voyage/voyage-3.5-lite", + "name": "voyage-3.5-lite", + "display_name": "voyage-3.5-lite", "modalities": { "input": [ "text" @@ -16656,27 +16195,27 @@ ] }, "limit": { - "context": 32768, - "output": 8192 + "context": 8192, + "output": 1536 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" - }, "attachment": false, - "type": "chat" + "open_weights": false, + "release_date": "2025-05-20", + "last_updated": "2025-05-20", + "cost": { + "input": 0.02, + "output": 0 + } }, { - "id": "qwen-max-2024-04-28", - "name": "Qwen Max 2024 04 28", - "display_name": "Qwen Max 2024 04 28", + "id": "voyage/voyage-3.5", + "name": "voyage-3.5", + "display_name": "voyage-3.5", "modalities": { "input": [ "text" @@ -16686,21 +16225,27 @@ ] }, "limit": { - "context": 8000, - "output": 2000 + "context": 8192, + "output": 1536 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "type": "chat" + "open_weights": false, + "release_date": "2025-05-20", + "last_updated": "2025-05-20", + "cost": { + "input": 0.06, + "output": 0 + } }, { - "id": "qwen-max-2024-04-03", - "name": "Qwen Max 2024 04 03", - "display_name": "Qwen Max 2024 04 03", + "id": "voyage/voyage-finance-2", + "name": "voyage-finance-2", + "display_name": "voyage-finance-2", "modalities": { "input": [ "text" @@ -16710,21 +16255,27 @@ ] }, "limit": { - "context": 8000, - "output": 2000 + "context": 8192, + "output": 1536 }, - "temperature": true, - "tool_call": true, - "reasoning": { + "temperature": false, + "tool_call": false, + "reasoning": { "supported": false }, "attachment": false, - "type": "chat" + "open_weights": false, + "release_date": "2024-03", + "last_updated": "2024-03", + "cost": { + "input": 0.12, + "output": 0 + } }, { - "id": "qwen-max-2025-01-25", - "name": "Qwen Max 2025 01 25", - "display_name": "Qwen Max 2025 01 25", + "id": "voyage/voyage-law-2", + "name": "voyage-law-2", + "display_name": "voyage-law-2", "modalities": { "input": [ "text" @@ -16734,27 +16285,27 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 8192, + "output": 1536 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" - }, "attachment": false, - "type": "chat" + "open_weights": false, + "release_date": "2024-03", + "last_updated": "2024-03", + "cost": { + "input": 0.12, + "output": 0 + } }, { - "id": "qwen3-max-2025-09-23", - "name": "Qwen3 Max 20250923", - "display_name": "Qwen3 Max 20250923", + "id": "voyage/voyage-code-3", + "name": "voyage-code-3", + "display_name": "voyage-code-3", "modalities": { "input": [ "text" @@ -16764,27 +16315,27 @@ ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 8192, + "output": 1536 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" - }, "attachment": false, - "type": "chat" + "open_weights": false, + "release_date": "2024-09", + "last_updated": "2024-09", + "cost": { + "input": 0.18, + "output": 0 + } }, { - "id": "qwen3-max-preview", - "name": "Qwen3 Max Preview", - "display_name": "Qwen3 Max Preview", + "id": "voyage/voyage-3-large", + "name": "voyage-3-large", + "display_name": "voyage-3-large", "modalities": { "input": [ "text" @@ -16794,27 +16345,27 @@ ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 8192, + "output": 1536 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" - }, "attachment": false, - "type": "chat" + "open_weights": false, + "release_date": "2024-09", + "last_updated": "2024-09", + "cost": { + "input": 0.18, + "output": 0 + } }, { - "id": "qwen3-235b-a22b-thinking-2507", - "name": "Qwen3 235B A22B Thinking 2507", - "display_name": "Qwen3 235B A22B Thinking 2507", + "id": "google/gemini-embedding-001", + "name": "Gemini Embedding 001", + "display_name": "Gemini Embedding 001", "modalities": { "input": [ "text" @@ -16824,195 +16375,216 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 8192, + "output": 1536 }, - "temperature": true, + "temperature": false, "tool_call": false, "reasoning": { - "supported": true, - "default": true, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } + "supported": false }, "attachment": false, - "type": "chat" + "open_weights": false, + "release_date": "2025-05-20", + "last_updated": "2025-05-20", + "cost": { + "input": 0.15, + "output": 0 + } }, { - "id": "qwen3-235b-a22b-instruct-2507", - "name": "Qwen3 235B A22B Instruct 2507", - "display_name": "Qwen3 235B A22B Instruct 2507", + "id": "google/imagen-4.0-ultra-generate-001", + "name": "Imagen 4 Ultra", + "display_name": "Imagen 4 Ultra", "modalities": { "input": [ "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 480, + "output": 0 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "type": "chat" + "open_weights": false, + "release_date": "2025-05-24", + "last_updated": "2025-05-24" }, { - "id": "qwen3-30b-a3b-instruct-2507", - "name": "Qwen3 30B A3B Instruct 2507", - "display_name": "Qwen3 30B A3B Instruct 2507", + "id": "google/gemini-2.5-flash-image", + "name": "Nano Banana (Gemini 2.5 Flash Image)", + "display_name": "Nano Banana (Gemini 2.5 Flash Image)", "modalities": { "input": [ "text" ], "output": [ - "text" + "text", + "image" ] }, "limit": { - "context": 131072, + "context": 32768, "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "type": "chat" + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-03-20", + "cost": { + "input": 0.3, + "output": 2.5 + } }, { - "id": "qwen3-30b-a3b-thinking-2507", - "name": "Qwen3 30B A3B Thinking 2507", - "display_name": "Qwen3 30B A3B Thinking 2507", + "id": "google/imagen-4.0-fast-generate-001", + "name": "Imagen 4 Fast", + "display_name": "Imagen 4 Fast", "modalities": { "input": [ "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 480, + "output": 0 }, - "temperature": true, + "temperature": false, "tool_call": false, "reasoning": { - "supported": true, - "default": true, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } + "supported": false }, "attachment": false, - "type": "chat" + "open_weights": false, + "release_date": "2025-06", + "last_updated": "2025-06" }, { - "id": "qwen3-30b-a3b", - "name": "Qwen3 30B A3B", - "display_name": "Qwen3 30B A3B", + "id": "google/imagen-4.0-generate-001", + "name": "Imagen 4", + "display_name": "Imagen 4", "modalities": { "input": [ "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 480, + "output": 0 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": false, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } + "supported": false }, "attachment": false, - "type": "chat" + "open_weights": false, + "release_date": "2025-05-22", + "last_updated": "2025-05-22" }, { - "id": "qwen3-4b", - "name": "Qwen3 4B", - "display_name": "Qwen3 4B", + "id": "google/gemini-3-pro-preview", + "name": "Gemini 3 Pro Preview", + "display_name": "Gemini 3 Pro Preview", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1000000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true, - "budget": { - "default": 38912, - "min": 0, - "max": 38912 - } + "default": true }, - "attachment": false, - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", + "cost": { + "input": 2, + "output": 12, + "cache_read": 0.2, + "context_over_200k": { + "input": 4, + "output": 18, + "cache_read": 0.4 + } + } }, { - "id": "qwen3-1.7b", - "name": "Qwen3 1.7B", - "display_name": "Qwen3 1.7B", + "id": "google/gemini-2.5-flash-lite", + "name": "Gemini 2.5 Flash Lite", + "display_name": "Gemini 2.5 Flash Lite", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 8192 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true, - "budget": { - "default": 30720, - "min": 0, - "max": 30720 - } + "default": true }, - "attachment": false, - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", + "cost": { + "input": 0.1, + "output": 0.4, + "cache_read": 0.01 + } }, { - "id": "qwen3-0.6b", - "name": "Qwen3 0.6B", - "display_name": "Qwen3 0.6B", + "id": "google/text-multilingual-embedding-002", + "name": "Text Multilingual Embedding 002", + "display_name": "Text Multilingual Embedding 002", "modalities": { "input": [ "text" @@ -17022,58 +16594,59 @@ ] }, "limit": { - "context": 32768, - "output": 8192 + "context": 8192, + "output": 1536 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true, - "budget": { - "default": 30720, - "min": 0, - "max": 30720 - } + "supported": false }, "attachment": false, - "type": "chat" + "open_weights": false, + "release_date": "2024-03", + "last_updated": "2024-03", + "cost": { + "input": 0.03, + "output": 0 + } }, { - "id": "qwen3-vl-plus-2025-09-23", - "name": "Qwen3 VL Plus 2025 09 23", - "display_name": "Qwen3 VL Plus 2025 09 23", + "id": "google/gemini-3-pro-image", + "name": "Nano Banana Pro (Gemini 3 Pro Image)", + "display_name": "Nano Banana Pro (Gemini 3 Pro Image)", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "text" + "text", + "image" ] }, "limit": { - "context": 262144, + "context": 65536, "output": 32768 }, "temperature": true, "tool_call": false, "reasoning": { - "supported": true, - "default": false, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } + "supported": false }, "attachment": false, - "type": "chat" + "open_weights": false, + "knowledge": "2025-03", + "release_date": "2025-09", + "last_updated": "2025-09", + "cost": { + "input": 2, + "output": 120 + } }, { - "id": "qwq-plus-latest", - "name": "QwQ Plus Latest", - "display_name": "QwQ Plus Latest", + "id": "google/text-embedding-005", + "name": "Text Embedding 005", + "display_name": "Text Embedding 005", "modalities": { "input": [ "text" @@ -17083,106 +16656,59 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 8192, + "output": 1536 }, - "temperature": true, + "temperature": false, "tool_call": false, "reasoning": { - "supported": true, - "default": true, - "budget": { - "default": 32768, - "min": 0, - "max": 32768 - } - }, - "search": { "supported": false }, "attachment": false, - "type": "chat" - } - ] - }, - "venice": { - "id": "venice", - "name": "Venice AI", - "display_name": "Venice AI", - "api": "https://api.venice.ai/api/v1", - "doc": "https://docs.venice.ai", - "models": [ - { - "id": "grok-41-fast", - "name": "Grok 4.1 Fast", - "display_name": "Grok 4.1 Fast", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 262144, - "output": 65536 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "attachment": true, "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-12-01", - "last_updated": "2025-12-29", + "release_date": "2024-08", + "last_updated": "2024-08", "cost": { - "input": 0.5, - "output": 1.25, - "cache_read": 0.125 - }, - "type": "chat" + "input": 0.03, + "output": 0 + } }, { - "id": "qwen3-235b-a22b-instruct-2507", - "name": "Qwen 3 235B A22B Instruct 2507", - "display_name": "Qwen 3 235B A22B Instruct 2507", + "id": "google/gemini-2.5-flash-image-preview", + "name": "Nano Banana Preview (Gemini 2.5 Flash Image Preview)", + "display_name": "Nano Banana Preview (Gemini 2.5 Flash Image Preview)", "modalities": { "input": [ "text" ], "output": [ - "text" + "text", + "image" ] }, "limit": { - "context": 131072, + "context": 32768, "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-07", - "release_date": "2025-04-29", - "last_updated": "2025-12-18", + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-03-20", "cost": { - "input": 0.15, - "output": 0.75 - }, - "type": "chat" + "input": 0.3, + "output": 2.5 + } }, { - "id": "gemini-3-flash-preview", - "name": "Gemini 3 Flash Preview", - "display_name": "Gemini 3 Flash Preview", + "id": "google/gemini-2.5-flash-preview-09-2025", + "name": "Gemini 2.5 Flash Preview 09-25", + "display_name": "Gemini 2.5 Flash Preview 09-25", "modalities": { "input": [ "text", @@ -17196,7 +16722,7 @@ ] }, "limit": { - "context": 262144, + "context": 1048576, "output": 65536 }, "temperature": true, @@ -17208,19 +16734,19 @@ "attachment": true, "open_weights": false, "knowledge": "2025-01", - "release_date": "2025-12-19", - "last_updated": "2025-12-30", + "release_date": "2025-09-25", + "last_updated": "2025-09-25", "cost": { - "input": 0.7, - "output": 3.75, - "cache_read": 0.07 - }, - "type": "chat" + "input": 0.3, + "output": 2.5, + "cache_read": 0.03, + "cache_write": 0.383 + } }, { - "id": "claude-opus-45", - "name": "Claude Opus 4.5", - "display_name": "Claude Opus 4.5", + "id": "google/gemini-3-flash", + "name": "Gemini 3 Flash", + "display_name": "Gemini 3 Flash", "modalities": { "input": [ "text", @@ -17232,8 +16758,8 @@ ] }, "limit": { - "context": 202752, - "output": 50688 + "context": 1000000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -17244,62 +16770,69 @@ "attachment": true, "open_weights": false, "knowledge": "2025-03", - "release_date": "2025-12-06", - "last_updated": "2025-12-29", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", "cost": { - "input": 6, - "output": 30, - "cache_read": 0.6 - }, - "type": "chat" + "input": 0.5, + "output": 3, + "cache_read": 0.05 + } }, { - "id": "mistral-31-24b", - "name": "Venice Medium", - "display_name": "Venice Medium", + "id": "google/gemini-2.5-flash-lite-preview-09-2025", + "name": "Gemini 2.5 Flash Lite Preview 09-25", + "display_name": "Gemini 2.5 Flash Lite Preview 09-25", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2025-03-18", - "last_updated": "2025-12-18", + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-09-25", + "last_updated": "2025-09-25", "cost": { - "input": 0.5, - "output": 2 - }, - "type": "chat" + "input": 0.1, + "output": 0.4, + "cache_read": 0.01 + } }, { - "id": "grok-code-fast-1", - "name": "Grok Code Fast 1", - "display_name": "Grok Code Fast 1", + "id": "google/gemini-2.5-pro", + "name": "Gemini 2.5 Pro", + "display_name": "Gemini 2.5 Pro", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, + "context": 1048576, "output": 65536 }, "temperature": true, @@ -17308,100 +16841,107 @@ "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-12-01", - "last_updated": "2026-01-02", + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-06-05", "cost": { - "input": 0.25, - "output": 1.87, - "cache_read": 0.03 - }, - "type": "chat" + "input": 1.25, + "output": 10, + "cache_read": 0.31 + } }, { - "id": "zai-org-glm-4.7", - "name": "GLM 4.7", - "display_name": "GLM 4.7", + "id": "google/gemini-2.0-flash", + "name": "Gemini 2.0 Flash", + "display_name": "Gemini 2.0 Flash", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 202752, - "output": 50688 + "context": 1048576, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-24", - "last_updated": "2026-01-07", + "attachment": true, + "open_weights": false, + "knowledge": "2024-06", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 0.55, - "output": 2.65 - }, - "type": "chat" + "input": 0.1, + "output": 0.4, + "cache_read": 0.025 + } }, { - "id": "venice-uncensored", - "name": "Venice Uncensored 1.1", - "display_name": "Venice Uncensored 1.1", + "id": "google/gemini-2.0-flash-lite", + "name": "Gemini 2.0 Flash Lite", + "display_name": "Gemini 2.0 Flash Lite", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 32768, + "context": 1048576, "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2025-03-18", - "last_updated": "2025-12-18", + "attachment": true, + "open_weights": false, + "knowledge": "2024-06", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 0.2, - "output": 0.9 - }, - "type": "chat" + "input": 0.075, + "output": 0.3 + } }, { - "id": "gemini-3-pro-preview", - "name": "Gemini 3 Pro Preview", - "display_name": "Gemini 3 Pro Preview", + "id": "google/gemini-2.5-flash", + "name": "Gemini 2.5 Flash", + "display_name": "Gemini 2.5 Flash", "modalities": { "input": [ "text", "image", "audio", - "video" + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 202752, - "output": 50688 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -17411,20 +16951,20 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-12-02", - "last_updated": "2025-12-29", + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-06-05", "cost": { - "input": 2.5, - "output": 15, - "cache_read": 0.625 - }, - "type": "chat" + "input": 0.3, + "output": 2.5, + "cache_read": 0.075, + "input_audio": 1 + } }, { - "id": "openai-gpt-52", - "name": "GPT-5.2", - "display_name": "GPT-5.2", + "id": "prime-intellect/intellect-3", + "name": "INTELLECT 3", + "display_name": "INTELLECT 3", "modalities": { "input": [ "text" @@ -17434,8 +16974,8 @@ ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -17445,20 +16985,18 @@ }, "attachment": false, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-13", - "last_updated": "2025-12-29", + "knowledge": "2024-10", + "release_date": "2025-11-26", + "last_updated": "2025-11-26", "cost": { - "input": 2.19, - "output": 17.5, - "cache_read": 0.219 - }, - "type": "chat" + "input": 0.2, + "output": 1.1 + } }, { - "id": "qwen3-4b", - "name": "Venice Small", - "display_name": "Venice Small", + "id": "inception/mercury-coder-small", + "name": "Mercury Coder Small Beta", + "display_name": "Mercury Coder Small Beta", "modalities": { "input": [ "text" @@ -17468,30 +17006,28 @@ ] }, "limit": { - "context": 32768, - "output": 8192 + "context": 32000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-04-29", - "last_updated": "2025-12-18", + "open_weights": false, + "knowledge": "2024-10", + "release_date": "2025-02-26", + "last_updated": "2025-02-26", "cost": { - "input": 0.05, - "output": 0.15 - }, - "type": "chat" + "input": 0.25, + "output": 1 + } }, { - "id": "llama-3.3-70b", - "name": "Llama 3.3 70B", - "display_name": "Llama 3.3 70B", + "id": "openai/text-embedding-3-small", + "name": "text-embedding-3-small", + "display_name": "text-embedding-3-small", "modalities": { "input": [ "text" @@ -17501,61 +17037,62 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 8192, + "output": 1536 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2025-04-06", - "last_updated": "2025-12-29", + "open_weights": false, + "release_date": "2024-01-25", + "last_updated": "2024-01-25", "cost": { - "input": 0.7, - "output": 2.8 - }, - "type": "chat" + "input": 0.02, + "output": 0 + } }, { - "id": "openai-gpt-oss-120b", - "name": "OpenAI GPT OSS 120B", - "display_name": "OpenAI GPT OSS 120B", + "id": "openai/gpt-5.2-chat", + "name": "GPT-5.2 Chat", + "display_name": "GPT-5.2 Chat", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-07", - "release_date": "2025-11-06", - "last_updated": "2025-12-29", + "attachment": true, + "open_weights": false, + "knowledge": "2024-10", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.07, - "output": 0.3 - }, - "type": "chat" + "input": 1.75, + "output": 14, + "cache_read": 0.18 + } }, { - "id": "kimi-k2-thinking", - "name": "Kimi K2 Thinking", - "display_name": "Kimi K2 Thinking", + "id": "openai/gpt-oss-safeguard-20b", + "name": "gpt-oss-safeguard-20b", + "display_name": "gpt-oss-safeguard-20b", "modalities": { "input": [ "text" @@ -17565,7 +17102,7 @@ ] }, "limit": { - "context": 262144, + "context": 131072, "output": 65536 }, "temperature": true, @@ -17575,32 +17112,33 @@ "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2024-04", - "release_date": "2025-12-10", - "last_updated": "2025-12-30", + "open_weights": false, + "knowledge": "2024-10", + "release_date": "2024-12-01", + "last_updated": "2024-12-01", "cost": { - "input": 0.75, - "output": 3.2, - "cache_read": 0.375 - }, - "type": "chat" + "input": 0.08, + "output": 0.3, + "cache_read": 0.04 + } }, { - "id": "qwen3-235b-a22b-thinking-2507", - "name": "Qwen 3 235B A22B Thinking 2507", - "display_name": "Qwen 3 235B A22B Thinking 2507", + "id": "openai/gpt-5.2-codex", + "name": "GPT-5.2-Codex", + "display_name": "GPT-5.2-Codex", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 400000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -17608,161 +17146,171 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-07", - "release_date": "2025-04-29", - "last_updated": "2025-12-18", + "attachment": true, + "open_weights": false, + "knowledge": "2024-10", + "release_date": "2025-12", + "last_updated": "2025-12", "cost": { - "input": 0.45, - "output": 3.5 - }, - "type": "chat" + "input": 1.75, + "output": 14, + "cache_read": 0.175 + } }, { - "id": "llama-3.2-3b", - "name": "Llama 3.2 3B", - "display_name": "Llama 3.2 3B", + "id": "openai/gpt-5.1-codex", + "name": "GPT-5.1-Codex", + "display_name": "GPT-5.1-Codex", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 400000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-10-03", - "last_updated": "2025-12-18", + "attachment": true, + "open_weights": false, + "knowledge": "2024-10", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.15, - "output": 0.6 - }, - "type": "chat" + "input": 1.25, + "output": 10, + "cache_read": 0.13 + } }, { - "id": "google-gemma-3-27b-it", - "name": "Google Gemma 3 27B Instruct", - "display_name": "Google Gemma 3 27B Instruct", + "id": "openai/gpt-5-chat", + "name": "GPT-5 Chat", + "display_name": "GPT-5 Chat", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ - "text" + "text", + "image" ] }, "limit": { - "context": 202752, - "output": 50688 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, - "open_weights": true, - "knowledge": "2025-07", - "release_date": "2025-11-04", - "last_updated": "2025-12-29", + "open_weights": false, + "knowledge": "2024-10", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.12, - "output": 0.2 - }, - "type": "chat" + "input": 1.25, + "output": 10, + "cache_read": 0.13 + } }, { - "id": "hermes-3-llama-3.1-405b", - "name": "Hermes 3 Llama 3.1 405b", - "display_name": "Hermes 3 Llama 3.1 405b", + "id": "openai/o3-deep-research", + "name": "o3-deep-research", + "display_name": "o3-deep-research", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 200000, + "output": 100000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-04", - "release_date": "2025-09-25", - "last_updated": "2025-12-29", + "attachment": true, + "open_weights": false, + "knowledge": "2024-10", + "release_date": "2024-06-26", + "last_updated": "2024-06-26", "cost": { - "input": 1.1, - "output": 3 - }, - "type": "chat" + "input": 10, + "output": 40, + "cache_read": 2.5 + } }, { - "id": "zai-org-glm-4.6v", - "name": "GLM 4.6V", - "display_name": "GLM 4.6V", + "id": "openai/gpt-3.5-turbo", + "name": "GPT-3.5 Turbo", + "display_name": "GPT-3.5 Turbo", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 16385, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": true, - "release_date": "2025-12-11", - "last_updated": "2025-12-29", + "attachment": false, + "open_weights": false, + "knowledge": "2021-09", + "release_date": "2023-03-01", + "last_updated": "2023-03-01", "cost": { - "input": 0.39, - "output": 1.13 - }, - "type": "chat" + "input": 0.5, + "output": 1.5 + } }, { - "id": "minimax-m21", - "name": "MiniMax M2.1", - "display_name": "MiniMax M2.1", + "id": "openai/gpt-5.2-pro", + "name": "GPT 5.2 ", + "display_name": "GPT 5.2 ", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 202752, - "output": 50688 + "context": 400000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -17770,21 +17318,20 @@ "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-12-01", - "last_updated": "2026-01-02", + "knowledge": "2024-10", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.4, - "output": 1.6, - "cache_read": 0.04 - }, - "type": "chat" + "input": 21, + "output": 168 + } }, { - "id": "qwen3-next-80b", - "name": "Qwen 3 Next 80b", - "display_name": "Qwen 3 Next 80b", + "id": "openai/text-embedding-3-large", + "name": "text-embedding-3-large", + "display_name": "text-embedding-3-large", "modalities": { "input": [ "text" @@ -17794,168 +17341,134 @@ ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 8192, + "output": 1536 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-07", - "release_date": "2025-04-29", - "last_updated": "2025-12-18", + "open_weights": false, + "release_date": "2024-01-25", + "last_updated": "2024-01-25", "cost": { - "input": 0.35, - "output": 1.9 - }, - "type": "chat" + "input": 0.13, + "output": 0 + } }, { - "id": "zai-org-glm-4.6", - "name": "GLM 4.6", - "display_name": "GLM 4.6", + "id": "openai/gpt-5.1-codex-mini", + "name": "GPT-5.1 Codex mini", + "display_name": "GPT-5.1 Codex mini", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 202752, - "output": 50688 + "context": 400000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-04", - "release_date": "2025-10-18", - "last_updated": "2025-12-29", + "attachment": true, + "open_weights": false, + "knowledge": "2024-10", + "release_date": "2025-05-16", + "last_updated": "2025-05-16", "cost": { - "input": 0.85, - "output": 2.75 - }, - "type": "chat" + "input": 0.25, + "output": 2, + "cache_read": 0.03 + } }, { - "id": "qwen3-coder-480b-a35b-instruct", - "name": "Qwen 3 Coder 480b", - "display_name": "Qwen 3 Coder 480b", + "id": "openai/gpt-5.1-instant", + "name": "GPT-5.1 Instant", + "display_name": "GPT-5.1 Instant", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ - "text" + "text", + "image" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-07", - "release_date": "2025-04-29", - "last_updated": "2025-12-18", + "attachment": true, + "open_weights": false, + "knowledge": "2024-10", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.75, - "output": 3 - }, - "type": "chat" + "input": 1.25, + "output": 10, + "cache_read": 0.13 + } }, { - "id": "deepseek-v3.2", - "name": "DeepSeek V3.2", - "display_name": "DeepSeek V3.2", + "id": "openai/gpt-5.1-thinking", + "name": "GPT 5.1 Thinking", + "display_name": "GPT 5.1 Thinking", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ - "text" + "text", + "image" ] }, "limit": { - "context": 163840, - "output": 40960 - }, - "temperature": true, - "tool_call": false, - "reasoning": { - "supported": true, - "default": true - }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-10", - "release_date": "2025-12-04", - "last_updated": "2025-12-29", - "cost": { - "input": 0.4, - "output": 1, - "cache_read": 0.2 - }, - "type": "chat" - } - ] - }, - "siliconflow": { - "id": "siliconflow", - "name": "SiliconFlow", - "display_name": "SiliconFlow", - "api": "https://api.siliconflow.cn/v1", - "doc": "https://cloud.siliconflow.com/models", - "models": [ - { - "id": "inclusionAI/Ring-flash-2.0", - "name": "inclusionAI/Ring-flash-2.0", - "display_name": "inclusionAI/Ring-flash-2.0", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 131072, - "output": 8192 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-09-29", - "last_updated": "2025-11-25", + "knowledge": "2024-10", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.14, - "output": 0.57 - }, - "type": "chat" + "input": 1.25, + "output": 10, + "cache_read": 0.13 + } }, { - "id": "inclusionAI/Ling-flash-2.0", - "name": "inclusionAI/Ling-flash-2.0", - "display_name": "inclusionAI/Ling-flash-2.0", + "id": "openai/text-embedding-ada-002", + "name": "text-embedding-ada-002", + "display_name": "text-embedding-ada-002", "modalities": { "input": [ "text" @@ -17965,70 +17478,74 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 8192, + "output": 1536 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-09-18", - "last_updated": "2025-11-25", + "release_date": "2022-12-15", + "last_updated": "2022-12-15", "cost": { - "input": 0.14, - "output": 0.57 - }, - "type": "chat" + "input": 0.1, + "output": 0 + } }, { - "id": "inclusionAI/Ling-mini-2.0", - "name": "inclusionAI/Ling-mini-2.0", - "display_name": "inclusionAI/Ling-mini-2.0", + "id": "openai/o3-pro", + "name": "o3 Pro", + "display_name": "o3 Pro", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-09-10", - "last_updated": "2025-11-25", + "knowledge": "2024-10", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "cost": { - "input": 0.07, - "output": 0.28 - }, - "type": "chat" + "input": 20, + "output": 80 + } }, { - "id": "moonshotai/Kimi-K2-Thinking", - "name": "moonshotai/Kimi-K2-Thinking", - "display_name": "moonshotai/Kimi-K2-Thinking", + "id": "openai/gpt-5.1-codex-max", + "name": "GPT 5.1 Codex Max", + "display_name": "GPT 5.1 Codex Max", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 400000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -18036,20 +17553,21 @@ "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-11-07", - "last_updated": "2025-11-25", + "knowledge": "2024-10", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.55, - "output": 2.5 - }, - "type": "chat" + "input": 1.25, + "output": 10, + "cache_read": 0.13 + } }, { - "id": "moonshotai/Kimi-K2-Instruct-0905", - "name": "moonshotai/Kimi-K2-Instruct-0905", - "display_name": "moonshotai/Kimi-K2-Instruct-0905", + "id": "openai/gpt-3.5-turbo-instruct", + "name": "GPT-3.5 Turbo Instruct", + "display_name": "GPT-3.5 Turbo Instruct", "modalities": { "input": [ "text" @@ -18059,59 +17577,63 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 8192, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-09-08", - "last_updated": "2025-11-25", + "knowledge": "2021-09", + "release_date": "2023-03-01", + "last_updated": "2023-03-01", "cost": { - "input": 0.4, + "input": 1.5, "output": 2 - }, - "type": "chat" + } }, { - "id": "moonshotai/Kimi-Dev-72B", - "name": "moonshotai/Kimi-Dev-72B", - "display_name": "moonshotai/Kimi-Dev-72B", + "id": "openai/codex-mini", + "name": "Codex Mini", + "display_name": "Codex Mini", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 200000, + "output": 100000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-06-19", - "last_updated": "2025-11-25", + "knowledge": "2024-10", + "release_date": "2025-05-16", + "last_updated": "2025-05-16", "cost": { - "input": 0.29, - "output": 1.15 - }, - "type": "chat" + "input": 1.5, + "output": 6, + "cache_read": 0.38 + } }, { - "id": "moonshotai/Kimi-K2-Instruct", - "name": "moonshotai/Kimi-K2-Instruct", - "display_name": "moonshotai/Kimi-K2-Instruct", + "id": "openai/gpt-4o-mini-search-preview", + "name": "GPT 4o Mini Search Preview", + "display_name": "GPT 4o Mini Search Preview", "modalities": { "input": [ "text" @@ -18121,28 +17643,28 @@ ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 128000, + "output": 16384 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-07-13", - "last_updated": "2025-11-25", + "knowledge": "2023-09", + "release_date": "2025-01", + "last_updated": "2025-01", "cost": { - "input": 0.58, - "output": 2.29 - }, - "type": "chat" + "input": 0.15, + "output": 0.6 + } }, { - "id": "tencent/Hunyuan-A13B-Instruct", - "name": "tencent/Hunyuan-A13B-Instruct", - "display_name": "tencent/Hunyuan-A13B-Instruct", + "id": "openai/gpt-oss-20b", + "name": "GPT OSS 20B", + "display_name": "GPT OSS 20B", "modalities": { "input": [ "text" @@ -18153,27 +17675,28 @@ }, "limit": { "context": 131072, - "output": 8192 + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2025-06-30", - "last_updated": "2025-11-25", + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.14, - "output": 0.57 - }, - "type": "chat" + "input": 0.07, + "output": 0.3 + } }, { - "id": "tencent/Hunyuan-MT-7B", - "name": "tencent/Hunyuan-MT-7B", - "display_name": "tencent/Hunyuan-MT-7B", + "id": "openai/gpt-oss-120b", + "name": "GPT OSS 120B", + "display_name": "GPT OSS 120B", "modalities": { "input": [ "text" @@ -18184,195 +17707,213 @@ }, "limit": { "context": 131072, - "output": 8192 + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2025-09-18", - "last_updated": "2025-11-25", + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.1, + "output": 0.5 + } }, { - "id": "MiniMaxAI/MiniMax-M1-80k", - "name": "MiniMaxAI/MiniMax-M1-80k", - "display_name": "MiniMaxAI/MiniMax-M1-80k", + "id": "openai/gpt-5-pro", + "name": "GPT-5 pro", + "display_name": "GPT-5 pro", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ - "text" + "text", + "image" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 400000, + "output": 272000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-06-17", - "last_updated": "2025-11-25", + "knowledge": "2024-10", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.55, - "output": 2.2 - }, - "type": "chat" + "input": 15, + "output": 120 + } }, { - "id": "MiniMaxAI/MiniMax-M2", - "name": "MiniMaxAI/MiniMax-M2", - "display_name": "MiniMaxAI/MiniMax-M2", + "id": "openai/gpt-5.2", + "name": "GPT-5.2", + "display_name": "GPT-5.2", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 197000, - "output": 131000 + "context": 400000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-10-28", - "last_updated": "2025-11-25", + "knowledge": "2024-10", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.3, - "output": 1.2 - }, - "type": "chat" + "input": 1.75, + "output": 14, + "cache_read": 0.18 + } }, { - "id": "THUDM/GLM-Z1-32B-0414", - "name": "THUDM/GLM-Z1-32B-0414", - "display_name": "THUDM/GLM-Z1-32B-0414", + "id": "openai/gpt-5", + "name": "GPT-5", + "display_name": "GPT-5", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-04-18", - "last_updated": "2025-11-25", + "knowledge": "2024-09-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.14, - "output": 0.57 - }, - "type": "chat" + "input": 1.25, + "output": 10, + "cache_read": 0.125 + } }, { - "id": "THUDM/GLM-4-9B-0414", - "name": "THUDM/GLM-4-9B-0414", - "display_name": "THUDM/GLM-4-9B-0414", + "id": "openai/gpt-4o-mini", + "name": "GPT-4o mini", + "display_name": "GPT-4o mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-04-18", - "last_updated": "2025-11-25", + "knowledge": "2023-09", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", "cost": { - "input": 0.086, - "output": 0.086 - }, - "type": "chat" + "input": 0.15, + "output": 0.6, + "cache_read": 0.08 + } }, { - "id": "THUDM/GLM-Z1-9B-0414", - "name": "THUDM/GLM-Z1-9B-0414", - "display_name": "THUDM/GLM-Z1-9B-0414", + "id": "openai/o3", + "name": "o3", + "display_name": "o3", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-04-18", - "last_updated": "2025-11-25", + "knowledge": "2024-05", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "cost": { - "input": 0.086, - "output": 0.086 - }, - "type": "chat" + "input": 2, + "output": 8, + "cache_read": 0.5 + } }, { - "id": "THUDM/GLM-4.1V-9B-Thinking", - "name": "THUDM/GLM-4.1V-9B-Thinking", - "display_name": "THUDM/GLM-4.1V-9B-Thinking", + "id": "openai/gpt-5-mini", + "name": "GPT-5 Mini", + "display_name": "GPT-5 Mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -18380,123 +17921,132 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-07-04", - "last_updated": "2025-11-25", + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.035, - "output": 0.14 - }, - "type": "chat" + "input": 0.25, + "output": 2, + "cache_read": 0.025 + } }, { - "id": "THUDM/GLM-4-32B-0414", - "name": "THUDM/GLM-4-32B-0414", - "display_name": "THUDM/GLM-4-32B-0414", + "id": "openai/o1", + "name": "o1", + "display_name": "o1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-04-18", - "last_updated": "2025-11-25", + "knowledge": "2023-09", + "release_date": "2024-12-05", + "last_updated": "2024-12-05", "cost": { - "input": 0.27, - "output": 0.27 - }, - "type": "chat" + "input": 15, + "output": 60, + "cache_read": 7.5 + } }, { - "id": "openai/gpt-oss-120b", - "name": "openai/gpt-oss-120b", - "display_name": "openai/gpt-oss-120b", + "id": "openai/o4-mini", + "name": "o4-mini", + "display_name": "o4-mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131000, - "output": 8000 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-08-13", - "last_updated": "2025-11-25", + "knowledge": "2024-05", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "cost": { - "input": 0.05, - "output": 0.45 - }, - "type": "chat" - }, + "input": 1.1, + "output": 4.4, + "cache_read": 0.28 + } + }, { - "id": "openai/gpt-oss-20b", - "name": "openai/gpt-oss-20b", - "display_name": "openai/gpt-oss-20b", + "id": "openai/gpt-4.1", + "name": "GPT-4.1", + "display_name": "GPT-4.1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131000, - "output": 8000 + "context": 1047576, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-08-13", - "last_updated": "2025-11-25", + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.04, - "output": 0.18 - }, - "type": "chat" + "input": 2, + "output": 8, + "cache_read": 0.5 + } }, { - "id": "stepfun-ai/step3", - "name": "stepfun-ai/step3", - "display_name": "stepfun-ai/step3", + "id": "openai/gpt-4o", + "name": "GPT-4o", + "display_name": "GPT-4o", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -18505,31 +18055,33 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-08-06", - "last_updated": "2025-11-25", + "knowledge": "2023-09", + "release_date": "2024-05-13", + "last_updated": "2024-08-06", "cost": { - "input": 0.57, - "output": 1.42 - }, - "type": "chat" + "input": 2.5, + "output": 10, + "cache_read": 1.25 + } }, { - "id": "nex-agi/DeepSeek-V3.1-Nex-N1", - "name": "nex-agi/DeepSeek-V3.1-Nex-N1", - "display_name": "nex-agi/DeepSeek-V3.1-Nex-N1", + "id": "openai/gpt-5-codex", + "name": "GPT-5-Codex", + "display_name": "GPT-5-Codex", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -18537,49 +18089,53 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-01-01", - "last_updated": "2025-11-25", + "knowledge": "2024-09-30", + "release_date": "2025-09-15", + "last_updated": "2025-09-15", "cost": { - "input": 0.5, - "output": 2 - }, - "type": "chat" + "input": 1.25, + "output": 10, + "cache_read": 0.125 + } }, { - "id": "baidu/ERNIE-4.5-300B-A47B", - "name": "baidu/ERNIE-4.5-300B-A47B", - "display_name": "baidu/ERNIE-4.5-300B-A47B", + "id": "openai/gpt-5-nano", + "name": "GPT-5 Nano", + "display_name": "GPT-5 Nano", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-07-02", - "last_updated": "2025-11-25", + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.28, - "output": 1.1 - }, - "type": "chat" + "input": 0.05, + "output": 0.4, + "cache_read": 0.005 + } }, { - "id": "z-ai/GLM-4.5-Air", - "name": "z-ai/GLM-4.5-Air", - "display_name": "z-ai/GLM-4.5-Air", + "id": "openai/o3-mini", + "name": "o3-mini", + "display_name": "o3-mini", "modalities": { "input": [ "text" @@ -18589,121 +18145,128 @@ ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "release_date": "2025-07-28", - "last_updated": "2025-11-25", + "knowledge": "2024-05", + "release_date": "2024-12-20", + "last_updated": "2025-01-29", "cost": { - "input": 0.14, - "output": 0.86 - }, - "type": "chat" + "input": 1.1, + "output": 4.4, + "cache_read": 0.55 + } }, { - "id": "z-ai/GLM-4.5", - "name": "z-ai/GLM-4.5", - "display_name": "z-ai/GLM-4.5", + "id": "openai/gpt-4-turbo", + "name": "GPT-4 Turbo", + "display_name": "GPT-4 Turbo", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-07-28", - "last_updated": "2025-11-25", + "knowledge": "2023-12", + "release_date": "2023-11-06", + "last_updated": "2024-04-09", "cost": { - "input": 0.4, - "output": 2 - }, - "type": "chat" + "input": 10, + "output": 30 + } }, { - "id": "ByteDance-Seed/Seed-OSS-36B-Instruct", - "name": "ByteDance-Seed/Seed-OSS-36B-Instruct", - "display_name": "ByteDance-Seed/Seed-OSS-36B-Instruct", + "id": "openai/gpt-4.1-mini", + "name": "GPT-4.1 mini", + "display_name": "GPT-4.1 mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1047576, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-09-04", - "last_updated": "2025-11-25", + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.21, - "output": 0.57 - }, - "type": "chat" + "input": 0.4, + "output": 1.6, + "cache_read": 0.1 + } }, { - "id": "meta-llama/Meta-Llama-3.1-8B-Instruct", - "name": "meta-llama/Meta-Llama-3.1-8B-Instruct", - "display_name": "meta-llama/Meta-Llama-3.1-8B-Instruct", + "id": "openai/gpt-4.1-nano", + "name": "GPT-4.1 nano", + "display_name": "GPT-4.1 nano", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 33000, - "output": 4000 + "context": 1047576, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-04-23", - "last_updated": "2025-11-25", + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.06, - "output": 0.06 - }, - "type": "chat" + "input": 0.1, + "output": 0.4, + "cache_read": 0.03 + } }, { - "id": "Qwen/Qwen3-Next-80B-A3B-Thinking", - "name": "Qwen/Qwen3-Next-80B-A3B-Thinking", - "display_name": "Qwen/Qwen3-Next-80B-A3B-Thinking", + "id": "perplexity/sonar-reasoning", + "name": "Sonar Reasoning", + "display_name": "Sonar Reasoning", "modalities": { "input": [ "text" @@ -18713,91 +18276,61 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 127000, + "output": 8000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, "attachment": false, "open_weights": false, - "release_date": "2025-09-25", - "last_updated": "2025-11-25", - "cost": { - "input": 0.14, - "output": 0.57 - }, - "type": "chat" - }, - { - "id": "Qwen/Qwen2.5-14B-Instruct", - "name": "Qwen/Qwen2.5-14B-Instruct", - "display_name": "Qwen/Qwen2.5-14B-Instruct", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 131072, - "output": 8192 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "release_date": "2024-09-18", - "last_updated": "2025-11-25", + "knowledge": "2025-09", + "release_date": "2025-02-19", + "last_updated": "2025-02-19", "cost": { - "input": 0.1, - "output": 0.1 - }, - "type": "chat" + "input": 1, + "output": 5 + } }, { - "id": "Qwen/Qwen3-Next-80B-A3B-Instruct", - "name": "Qwen/Qwen3-Next-80B-A3B-Instruct", - "display_name": "Qwen/Qwen3-Next-80B-A3B-Instruct", + "id": "perplexity/sonar", + "name": "Sonar", + "display_name": "Sonar", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 127000, + "output": 8000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-09-18", - "last_updated": "2025-11-25", + "knowledge": "2025-02", + "release_date": "2025-02-19", + "last_updated": "2025-02-19", "cost": { - "input": 0.14, - "output": 1.4 - }, - "type": "chat" + "input": 1, + "output": 1 + } }, { - "id": "Qwen/Qwen3-VL-32B-Instruct", - "name": "Qwen/Qwen3-VL-32B-Instruct", - "display_name": "Qwen/Qwen3-VL-32B-Instruct", + "id": "perplexity/sonar-pro", + "name": "Sonar Pro", + "display_name": "Sonar Pro", "modalities": { "input": [ "text", @@ -18808,8 +18341,8 @@ ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 200000, + "output": 8000 }, "temperature": true, "tool_call": true, @@ -18818,18 +18351,18 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-10-21", - "last_updated": "2025-11-25", + "knowledge": "2025-09", + "release_date": "2025-02-19", + "last_updated": "2025-02-19", "cost": { - "input": 0.2, - "output": 0.6 - }, - "type": "chat" + "input": 3, + "output": 15 + } }, { - "id": "Qwen/Qwen3-Omni-30B-A3B-Thinking", - "name": "Qwen/Qwen3-Omni-30B-A3B-Thinking", - "display_name": "Qwen/Qwen3-Omni-30B-A3B-Thinking", + "id": "perplexity/sonar-reasoning-pro", + "name": "Sonar Reasoning Pro", + "display_name": "Sonar Reasoning Pro", "modalities": { "input": [ "text" @@ -18839,29 +18372,29 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 127000, + "output": 8000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-10-04", - "last_updated": "2025-11-25", + "knowledge": "2025-09", + "release_date": "2025-02-19", + "last_updated": "2025-02-19", "cost": { - "input": 0.1, - "output": 0.4 - }, - "type": "chat" + "input": 2, + "output": 8 + } }, { - "id": "Qwen/Qwen3-235B-A22B-Thinking-2507", - "name": "Qwen/Qwen3-235B-A22B-Thinking-2507", - "display_name": "Qwen/Qwen3-235B-A22B-Thinking-2507", + "id": "zai/glm-4.7", + "name": "GLM 4.7", + "display_name": "GLM 4.7", "modalities": { "input": [ "text" @@ -18871,8 +18404,8 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 202752, + "output": 120000 }, "temperature": true, "tool_call": true, @@ -18882,30 +18415,32 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-07-28", - "last_updated": "2025-11-25", + "knowledge": "2024-10", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "cost": { - "input": 0.13, - "output": 0.6 - }, - "type": "chat" + "input": 0.43, + "output": 1.75, + "cache_read": 0.08 + } }, { - "id": "Qwen/Qwen3-VL-32B-Thinking", - "name": "Qwen/Qwen3-VL-32B-Thinking", - "display_name": "Qwen/Qwen3-VL-32B-Thinking", + "id": "zai/glm-4.6v-flash", + "name": "GLM-4.6V-Flash", + "display_name": "GLM-4.6V-Flash", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 128000, + "output": 24000 }, "temperature": true, "tool_call": true, @@ -18915,18 +18450,14 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-10-21", - "last_updated": "2025-11-25", - "cost": { - "input": 0.2, - "output": 1.5 - }, - "type": "chat" + "knowledge": "2024-10", + "release_date": "2025-09-30", + "last_updated": "2025-09-30" }, { - "id": "Qwen/Qwen3-VL-30B-A3B-Thinking", - "name": "Qwen/Qwen3-VL-30B-A3B-Thinking", - "display_name": "Qwen/Qwen3-VL-30B-A3B-Thinking", + "id": "zai/glm-4.5", + "name": "GLM 4.5", + "display_name": "GLM 4.5", "modalities": { "input": [ "text" @@ -18937,7 +18468,7 @@ }, "limit": { "context": 131072, - "output": 8192 + "output": 131072 }, "temperature": true, "tool_call": true, @@ -18945,20 +18476,20 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-10-11", - "last_updated": "2025-11-25", + "attachment": false, + "open_weights": true, + "knowledge": "2025-07", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 0.29, - "output": 1 - }, - "type": "chat" + "input": 0.6, + "output": 2.2 + } }, { - "id": "Qwen/Qwen3-30B-A3B-Instruct-2507", - "name": "Qwen/Qwen3-30B-A3B-Instruct-2507", - "display_name": "Qwen/Qwen3-30B-A3B-Instruct-2507", + "id": "zai/glm-4.5-air", + "name": "GLM 4.5 Air", + "display_name": "GLM 4.5 Air", "modalities": { "input": [ "text" @@ -18968,39 +18499,41 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 96000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2025-07-30", - "last_updated": "2025-11-25", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 0.09, - "output": 0.3 - }, - "type": "chat" + "input": 0.2, + "output": 1.1 + } }, { - "id": "Qwen/Qwen3-VL-235B-A22B-Thinking", - "name": "Qwen/Qwen3-VL-235B-A22B-Thinking", - "display_name": "Qwen/Qwen3-VL-235B-A22B-Thinking", + "id": "zai/glm-4.5v", + "name": "GLM 4.5V", + "display_name": "GLM 4.5V", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 66000, + "output": 66000 }, "temperature": true, "tool_call": true, @@ -19009,19 +18542,19 @@ "default": true }, "attachment": true, - "open_weights": false, - "release_date": "2025-10-04", - "last_updated": "2025-11-25", + "open_weights": true, + "knowledge": "2025-08", + "release_date": "2025-08-11", + "last_updated": "2025-08-11", "cost": { - "input": 0.45, - "output": 3.5 - }, - "type": "chat" + "input": 0.6, + "output": 1.8 + } }, { - "id": "Qwen/Qwen3-Coder-480B-A35B-Instruct", - "name": "Qwen/Qwen3-Coder-480B-A35B-Instruct", - "display_name": "Qwen/Qwen3-Coder-480B-A35B-Instruct", + "id": "zai/glm-4.6", + "name": "GLM 4.6", + "display_name": "GLM 4.6", "modalities": { "input": [ "text" @@ -19031,27 +18564,29 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 200000, + "output": 96000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2025-07-31", - "last_updated": "2025-11-25", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", "cost": { - "input": 0.25, - "output": 1 + "input": 0.45, + "output": 1.8 } }, { - "id": "Qwen/Qwen3-VL-235B-A22B-Instruct", - "name": "Qwen/Qwen3-VL-235B-A22B-Instruct", - "display_name": "Qwen/Qwen3-VL-235B-A22B-Instruct", + "id": "zai/glm-4.7-flashx", + "name": "GLM 4.7 FlashX", + "display_name": "GLM 4.7 FlashX", "modalities": { "input": [ "text" @@ -19061,123 +18596,128 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 200000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-10-04", - "last_updated": "2025-11-25", + "attachment": false, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2025-01", + "last_updated": "2025-01", "cost": { - "input": 0.3, - "output": 1.5 - }, - "type": "chat" + "input": 0.06, + "output": 0.4, + "cache_read": 0.01 + } }, { - "id": "Qwen/Qwen3-VL-8B-Instruct", - "name": "Qwen/Qwen3-VL-8B-Instruct", - "display_name": "Qwen/Qwen3-VL-8B-Instruct", + "id": "zai/glm-4.6v", + "name": "GLM-4.6V", + "display_name": "GLM-4.6V", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 128000, + "output": 24000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "release_date": "2025-10-15", - "last_updated": "2025-11-25", + "knowledge": "2024-10", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", "cost": { - "input": 0.18, - "output": 0.68 - }, - "type": "chat" + "input": 0.3, + "output": 0.9, + "cache_read": 0.05 + } }, { - "id": "Qwen/Qwen3-32B", - "name": "Qwen/Qwen3-32B", - "display_name": "Qwen/Qwen3-32B", + "id": "amazon/nova-2-lite", + "name": "Nova 2 Lite", + "display_name": "Nova 2 Lite", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1000000, + "output": 1000000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-04-30", - "last_updated": "2025-11-25", + "knowledge": "2024-10", + "release_date": "2024-12-01", + "last_updated": "2024-12-01", "cost": { - "input": 0.14, - "output": 0.57 - }, - "type": "chat" + "input": 0.3, + "output": 2.5 + } }, { - "id": "Qwen/Qwen2.5-VL-7B-Instruct", - "name": "Qwen/Qwen2.5-VL-7B-Instruct", - "display_name": "Qwen/Qwen2.5-VL-7B-Instruct", + "id": "amazon/titan-embed-text-v2", + "name": "Titan Text Embeddings V2", + "display_name": "Titan Text Embeddings V2", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 33000, - "output": 4000 + "context": 8192, + "output": 1536 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-01-28", - "last_updated": "2025-11-25", + "release_date": "2024-04", + "last_updated": "2024-04", "cost": { - "input": 0.05, - "output": 0.05 - }, - "type": "chat" + "input": 0.02, + "output": 0 + } }, { - "id": "Qwen/QwQ-32B", - "name": "Qwen/QwQ-32B", - "display_name": "Qwen/QwQ-32B", + "id": "amazon/nova-micro", + "name": "Nova Micro", + "display_name": "Nova Micro", "modalities": { "input": [ "text" @@ -19187,7 +18727,7 @@ ] }, "limit": { - "context": 131072, + "context": 128000, "output": 8192 }, "temperature": true, @@ -19197,28 +18737,31 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-03-06", - "last_updated": "2025-11-25", + "knowledge": "2024-10", + "release_date": "2024-12-03", + "last_updated": "2024-12-03", "cost": { - "input": 0.15, - "output": 0.58 - }, - "type": "chat" + "input": 0.035, + "output": 0.14, + "cache_read": 0.00875 + } }, { - "id": "Qwen/Qwen2.5-VL-72B-Instruct", - "name": "Qwen/Qwen2.5-VL-72B-Instruct", - "display_name": "Qwen/Qwen2.5-VL-72B-Instruct", + "id": "amazon/nova-pro", + "name": "Nova Pro", + "display_name": "Nova Pro", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 131072, + "context": 300000, "output": 8192 }, "temperature": true, @@ -19228,28 +18771,31 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-01-28", - "last_updated": "2025-11-25", + "knowledge": "2024-10", + "release_date": "2024-12-03", + "last_updated": "2024-12-03", "cost": { - "input": 0.59, - "output": 0.59 - }, - "type": "chat" + "input": 0.8, + "output": 3.2, + "cache_read": 0.2 + } }, { - "id": "Qwen/Qwen3-235B-A22B", - "name": "Qwen/Qwen3-235B-A22B", - "display_name": "Qwen/Qwen3-235B-A22B", + "id": "amazon/nova-lite", + "name": "Nova Lite", + "display_name": "Nova Lite", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 131072, + "context": 300000, "output": 8192 }, "temperature": true, @@ -19257,20 +18803,21 @@ "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-04-30", - "last_updated": "2025-11-25", + "knowledge": "2024-10", + "release_date": "2024-12-03", + "last_updated": "2024-12-03", "cost": { - "input": 0.35, - "output": 1.42 - }, - "type": "chat" + "input": 0.06, + "output": 0.24, + "cache_read": 0.015 + } }, { - "id": "Qwen/Qwen2.5-7B-Instruct", - "name": "Qwen/Qwen2.5-7B-Instruct", - "display_name": "Qwen/Qwen2.5-7B-Instruct", + "id": "morph/morph-v3-fast", + "name": "Morph v3 Fast", + "display_name": "Morph v3 Fast", "modalities": { "input": [ "text" @@ -19280,28 +18827,27 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 16000, + "output": 16000 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2024-09-18", - "last_updated": "2025-11-25", + "release_date": "2024-08-15", + "last_updated": "2024-08-15", "cost": { - "input": 0.05, - "output": 0.05 - }, - "type": "chat" + "input": 0.8, + "output": 1.2 + } }, { - "id": "Qwen/Qwen3-Coder-30B-A3B-Instruct", - "name": "Qwen/Qwen3-Coder-30B-A3B-Instruct", - "display_name": "Qwen/Qwen3-Coder-30B-A3B-Instruct", + "id": "morph/morph-v3-large", + "name": "Morph v3 Large", + "display_name": "Morph v3 Large", "modalities": { "input": [ "text" @@ -19311,27 +18857,27 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 32000, + "output": 32000 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-08-01", - "last_updated": "2025-11-25", + "release_date": "2024-08-15", + "last_updated": "2024-08-15", "cost": { - "input": 0.07, - "output": 0.28 + "input": 0.9, + "output": 1.9 } }, { - "id": "Qwen/Qwen2.5-72B-Instruct", - "name": "Qwen/Qwen2.5-72B-Instruct", - "display_name": "Qwen/Qwen2.5-72B-Instruct", + "id": "meta/llama-3.1-8b", + "name": "Llama 3.1 8B Instruct", + "display_name": "Llama 3.1 8B Instruct", "modalities": { "input": [ "text" @@ -19342,7 +18888,7 @@ }, "limit": { "context": 131072, - "output": 8192 + "output": 16384 }, "temperature": true, "tool_call": true, @@ -19351,28 +18897,29 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-09-18", - "last_updated": "2025-11-25", + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 0.59, - "output": 0.59 - }, - "type": "chat" + "input": 0.03, + "output": 0.05 + } }, { - "id": "Qwen/Qwen2.5-72B-Instruct-128K", - "name": "Qwen/Qwen2.5-72B-Instruct-128K", - "display_name": "Qwen/Qwen2.5-72B-Instruct-128K", + "id": "meta/llama-3.2-90b", + "name": "Llama 3.2 90B Vision Instruct", + "display_name": "Llama 3.2 90B Vision Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, + "context": 128000, "output": 8192 }, "temperature": true, @@ -19380,20 +18927,20 @@ "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2024-09-18", - "last_updated": "2025-11-25", + "knowledge": "2023-12", + "release_date": "2024-09-25", + "last_updated": "2024-09-25", "cost": { - "input": 0.59, - "output": 0.59 - }, - "type": "chat" + "input": 0.72, + "output": 0.72 + } }, { - "id": "Qwen/Qwen2.5-32B-Instruct", - "name": "Qwen/Qwen2.5-32B-Instruct", - "display_name": "Qwen/Qwen2.5-32B-Instruct", + "id": "meta/llama-3.2-1b", + "name": "Llama 3.2 1B Instruct", + "display_name": "Llama 3.2 1B Instruct", "modalities": { "input": [ "text" @@ -19403,38 +18950,39 @@ ] }, "limit": { - "context": 131072, + "context": 128000, "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2024-09-19", - "last_updated": "2025-11-25", + "knowledge": "2023-12", + "release_date": "2024-09-18", + "last_updated": "2024-09-18", "cost": { - "input": 0.18, - "output": 0.18 - }, - "type": "chat" + "input": 0.1, + "output": 0.1 + } }, { - "id": "Qwen/Qwen2.5-Coder-32B-Instruct", - "name": "Qwen/Qwen2.5-Coder-32B-Instruct", - "display_name": "Qwen/Qwen2.5-Coder-32B-Instruct", + "id": "meta/llama-3.2-11b", + "name": "Llama 3.2 11B Vision Instruct", + "display_name": "Llama 3.2 11B Vision Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, + "context": 128000, "output": 8192 }, "temperature": true, @@ -19442,19 +18990,20 @@ "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2024-11-11", - "last_updated": "2025-11-25", + "knowledge": "2023-12", + "release_date": "2024-09-25", + "last_updated": "2024-09-25", "cost": { - "input": 0.18, - "output": 0.18 + "input": 0.16, + "output": 0.16 } }, { - "id": "Qwen/Qwen3-235B-A22B-Instruct-2507", - "name": "Qwen/Qwen3-235B-A22B-Instruct-2507", - "display_name": "Qwen/Qwen3-235B-A22B-Instruct-2507", + "id": "meta/llama-3.2-3b", + "name": "Llama 3.2 3B Instruct", + "display_name": "Llama 3.2 3B Instruct", "modalities": { "input": [ "text" @@ -19464,72 +19013,71 @@ ] }, "limit": { - "context": 131072, + "context": 128000, "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-07-23", - "last_updated": "2025-11-25", + "knowledge": "2023-12", + "release_date": "2024-09-18", + "last_updated": "2024-09-18", "cost": { - "input": 0.09, - "output": 0.6 - }, - "type": "chat" + "input": 0.15, + "output": 0.15 + } }, { - "id": "Qwen/Qwen3-VL-8B-Thinking", - "name": "Qwen/Qwen3-VL-8B-Thinking", - "display_name": "Qwen/Qwen3-VL-8B-Thinking", + "id": "meta/llama-3.1-70b", + "name": "Llama 3.1 70B Instruct", + "display_name": "Llama 3.1 70B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 131072, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-10-15", - "last_updated": "2025-11-25", + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 0.18, - "output": 2 - }, - "type": "chat" + "input": 0.4, + "output": 0.4 + } }, { - "id": "Qwen/Qwen3-Omni-30B-A3B-Instruct", - "name": "Qwen/Qwen3-Omni-30B-A3B-Instruct", - "display_name": "Qwen/Qwen3-Omni-30B-A3B-Instruct", + "id": "meta/llama-4-scout", + "name": "Llama-4-Scout-17B-16E-Instruct-FP8", + "display_name": "Llama-4-Scout-17B-16E-Instruct-FP8", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -19537,19 +19085,19 @@ "supported": false }, "attachment": true, - "open_weights": false, - "release_date": "2025-10-04", - "last_updated": "2025-11-25", + "open_weights": true, + "knowledge": "2024-08", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", "cost": { - "input": 0.1, - "output": 0.4 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "Qwen/Qwen3-8B", - "name": "Qwen/Qwen3-8B", - "display_name": "Qwen/Qwen3-8B", + "id": "meta/llama-3.3-70b", + "name": "Llama-3.3-70B-Instruct", + "display_name": "Llama-3.3-70B-Instruct", "modalities": { "input": [ "text" @@ -19559,39 +19107,40 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "release_date": "2025-04-30", - "last_updated": "2025-11-25", + "attachment": true, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 0.06, - "output": 0.06 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "Qwen/Qwen3-Omni-30B-A3B-Captioner", - "name": "Qwen/Qwen3-Omni-30B-A3B-Captioner", - "display_name": "Qwen/Qwen3-Omni-30B-A3B-Captioner", + "id": "meta/llama-4-maverick", + "name": "Llama-4-Maverick-17B-128E-Instruct-FP8", + "display_name": "Llama-4-Maverick-17B-128E-Instruct-FP8", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -19599,60 +19148,67 @@ "supported": false }, "attachment": true, - "open_weights": false, - "release_date": "2025-10-04", - "last_updated": "2025-11-25", + "open_weights": true, + "knowledge": "2024-08", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", "cost": { - "input": 0.1, - "output": 0.4 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "Qwen/Qwen2.5-VL-32B-Instruct", - "name": "Qwen/Qwen2.5-VL-32B-Instruct", - "display_name": "Qwen/Qwen2.5-VL-32B-Instruct", + "id": "anthropic/claude-haiku-4.5", + "name": "Claude Haiku 4.5", + "display_name": "Claude Haiku 4.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "release_date": "2025-03-24", - "last_updated": "2025-11-25", + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "cost": { - "input": 0.27, - "output": 0.27 - }, - "type": "chat" + "input": 1, + "output": 5, + "cache_read": 0.1, + "cache_write": 1.25 + } }, { - "id": "Qwen/Qwen3-14B", - "name": "Qwen/Qwen3-14B", - "display_name": "Qwen/Qwen3-14B", + "id": "anthropic/claude-3.5-sonnet-20240620", + "name": "Claude 3.5 Sonnet (2024-06-20)", + "display_name": "Claude 3.5 Sonnet (2024-06-20)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, + "context": 200000, "output": 8192 }, "temperature": true, @@ -19660,62 +19216,69 @@ "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-04-30", - "last_updated": "2025-11-25", + "knowledge": "2024-04", + "release_date": "2024-06-20", + "last_updated": "2024-06-20", "cost": { - "input": 0.07, - "output": 0.28 - }, - "type": "chat" + "input": 3, + "output": 15 + } }, { - "id": "Qwen/Qwen3-VL-30B-A3B-Instruct", - "name": "Qwen/Qwen3-VL-30B-A3B-Instruct", - "display_name": "Qwen/Qwen3-VL-30B-A3B-Instruct", + "id": "anthropic/claude-opus-4.5", + "name": "Claude Opus 4.5", + "display_name": "Claude Opus 4.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "release_date": "2025-10-05", - "last_updated": "2025-11-25", + "knowledge": "2025-03-31", + "release_date": "2025-11-24", + "last_updated": "2025-11-24", "cost": { - "input": 0.29, - "output": 1 - }, - "type": "chat" + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 18.75 + } }, { - "id": "Qwen/Qwen3-30B-A3B-Thinking-2507", - "name": "Qwen/Qwen3-30B-A3B-Thinking-2507", - "display_name": "Qwen/Qwen3-30B-A3B-Thinking-2507", + "id": "anthropic/claude-opus-4.6", + "name": "Claude Opus 4.6", + "display_name": "Claude Opus 4.6", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1000000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -19723,92 +19286,106 @@ "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-07-31", - "last_updated": "2025-11-25", + "knowledge": "2025-05", + "release_date": "2026-02", + "last_updated": "2026-02", "cost": { - "input": 0.09, - "output": 0.3 - }, - "type": "chat" + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 + } }, { - "id": "Qwen/Qwen3-30B-A3B", - "name": "Qwen/Qwen3-30B-A3B", - "display_name": "Qwen/Qwen3-30B-A3B", + "id": "anthropic/claude-sonnet-4.5", + "name": "Claude Sonnet 4.5", + "display_name": "Claude Sonnet 4.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-04-30", - "last_updated": "2025-11-25", + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 0.09, - "output": 0.45 - }, - "type": "chat" + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 + } }, { - "id": "zai-org/GLM-4.5-Air", - "name": "zai-org/GLM-4.5-Air", - "display_name": "zai-org/GLM-4.5-Air", + "id": "anthropic/claude-sonnet-4", + "name": "Claude Sonnet 4", + "display_name": "Claude Sonnet 4", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-07-28", - "last_updated": "2025-11-25", + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 0.14, - "output": 0.86 - }, - "type": "chat" + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 + } }, { - "id": "zai-org/GLM-4.5V", - "name": "zai-org/GLM-4.5V", - "display_name": "zai-org/GLM-4.5V", + "id": "anthropic/claude-3.5-haiku", + "name": "Claude Haiku 3.5", + "display_name": "Claude Haiku 3.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, + "context": 200000, "output": 8192 }, "temperature": true, @@ -19818,186 +19395,210 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-08-13", - "last_updated": "2025-11-25", + "knowledge": "2024-07-31", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", "cost": { - "input": 0.14, - "output": 0.86 - }, - "type": "chat" + "input": 0.8, + "output": 4, + "cache_read": 0.08, + "cache_write": 1 + } }, { - "id": "zai-org/GLM-4.6", - "name": "zai-org/GLM-4.6", - "display_name": "zai-org/GLM-4.6", + "id": "anthropic/claude-3.7-sonnet", + "name": "Claude Sonnet 3.7", + "display_name": "Claude Sonnet 3.7", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-10-04", - "last_updated": "2025-11-25", + "knowledge": "2024-10-31", + "release_date": "2025-02-19", + "last_updated": "2025-02-19", "cost": { - "input": 0.5, - "output": 1.9 - }, - "type": "chat" + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 + } }, { - "id": "zai-org/GLM-4.5", - "name": "zai-org/GLM-4.5", - "display_name": "zai-org/GLM-4.5", + "id": "anthropic/claude-opus-4.1", + "name": "Claude Opus 4", + "display_name": "Claude Opus 4", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 200000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-07-28", - "last_updated": "2025-11-25", + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 0.4, - "output": 2 - }, - "type": "chat" + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 + } }, { - "id": "deepseek-ai/DeepSeek-V3.1", - "name": "deepseek-ai/DeepSeek-V3.1", - "display_name": "deepseek-ai/DeepSeek-V3.1", + "id": "anthropic/claude-3.5-sonnet", + "name": "Claude Sonnet 3.5 v2", + "display_name": "Claude Sonnet 3.5 v2", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 164000, - "output": 164000 + "context": 200000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-08-25", - "last_updated": "2025-11-25", + "knowledge": "2024-04-30", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", "cost": { - "input": 0.27, - "output": 1 - }, - "type": "chat" + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 + } }, { - "id": "deepseek-ai/DeepSeek-V3", - "name": "deepseek-ai/DeepSeek-V3", - "display_name": "deepseek-ai/DeepSeek-V3", + "id": "anthropic/claude-3-opus", + "name": "Claude Opus 3", + "display_name": "Claude Opus 3", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 200000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2024-12-26", - "last_updated": "2025-11-25", + "knowledge": "2023-08-31", + "release_date": "2024-02-29", + "last_updated": "2024-02-29", "cost": { - "input": 0.25, - "output": 1 - }, - "type": "chat" + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 + } }, { - "id": "deepseek-ai/DeepSeek-R1-Distill-Qwen-7B", - "name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-7B", - "display_name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-7B", + "id": "anthropic/claude-3-haiku", + "name": "Claude Haiku 3", + "display_name": "Claude Haiku 3", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 200000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-01-20", - "last_updated": "2025-11-25", + "knowledge": "2023-08-31", + "release_date": "2024-03-13", + "last_updated": "2024-03-13", "cost": { - "input": 0.05, - "output": 0.05 - }, - "type": "chat" + "input": 0.25, + "output": 1.25, + "cache_read": 0.03, + "cache_write": 0.3 + } }, { - "id": "deepseek-ai/DeepSeek-V3.1-Terminus", - "name": "deepseek-ai/DeepSeek-V3.1-Terminus", - "display_name": "deepseek-ai/DeepSeek-V3.1-Terminus", + "id": "anthropic/claude-opus-4", + "name": "Claude Opus 4", + "display_name": "Claude Opus 4", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 200000, + "output": 32000 }, "temperature": true, "tool_call": true, @@ -20005,20 +19606,31 @@ "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-09-29", - "last_updated": "2025-11-25", + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 0.27, - "output": 1 - }, - "type": "chat" - }, + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 + } + } + ] + }, + "nebius": { + "id": "nebius", + "name": "Nebius Token Factory", + "display_name": "Nebius Token Factory", + "api": "https://api.tokenfactory.nebius.com/v1", + "doc": "https://docs.tokenfactory.nebius.com/", + "models": [ { - "id": "deepseek-ai/DeepSeek-V3.2-Exp", - "name": "deepseek-ai/DeepSeek-V3.2-Exp", - "display_name": "deepseek-ai/DeepSeek-V3.2-Exp", + "id": "NousResearch/hermes-4-70b", + "name": "Hermes-4-70B", + "display_name": "Hermes-4-70B", "modalities": { "input": [ "text" @@ -20028,28 +19640,32 @@ ] }, "limit": { - "context": 131072, + "context": 128000, "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2025-10-10", - "last_updated": "2025-11-25", + "open_weights": true, + "knowledge": "2025-11", + "release_date": "2026-01-30", + "last_updated": "2026-02-04", "cost": { - "input": 0.27, - "output": 0.41 - }, - "type": "chat" + "input": 0.13, + "output": 0.4, + "reasoning": 0.4, + "cache_read": 0.013, + "cache_write": 0.16 + } }, { - "id": "deepseek-ai/DeepSeek-R1-Distill-Qwen-14B", - "name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-14B", - "display_name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-14B", + "id": "NousResearch/hermes-4-405b", + "name": "Hermes-4-405B", + "display_name": "Hermes-4-405B", "modalities": { "input": [ "text" @@ -20059,7 +19675,7 @@ ] }, "limit": { - "context": 131072, + "context": 128000, "output": 8192 }, "temperature": true, @@ -20069,19 +19685,22 @@ "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2025-01-20", - "last_updated": "2025-11-25", + "open_weights": true, + "knowledge": "2025-11", + "release_date": "2026-01-30", + "last_updated": "2026-02-04", "cost": { - "input": 0.1, - "output": 0.1 - }, - "type": "chat" + "input": 1, + "output": 3, + "reasoning": 3, + "cache_read": 0.1, + "cache_write": 1.25 + } }, { - "id": "deepseek-ai/deepseek-vl2", - "name": "deepseek-ai/deepseek-vl2", - "display_name": "deepseek-ai/deepseek-vl2", + "id": "intfloat/e5-mistral-7b-instruct", + "name": "e5-mistral-7b-instruct", + "display_name": "e5-mistral-7b-instruct", "modalities": { "input": [ "text" @@ -20091,28 +19710,28 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 32768, + "output": 0 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2024-12-13", - "last_updated": "2025-11-25", + "attachment": false, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-01-01", + "last_updated": "2026-02-04", "cost": { - "input": 0.15, - "output": 0.15 - }, - "type": "chat" + "input": 0.01, + "output": 0 + } }, { - "id": "deepseek-ai/DeepSeek-R1-Distill-Qwen-32B", - "name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-32B", - "display_name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-32B", + "id": "moonshotai/kimi-k2-thinking", + "name": "Kimi-K2-Thinking", + "display_name": "Kimi-K2-Thinking", "modalities": { "input": [ "text" @@ -20122,8 +19741,8 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -20131,52 +19750,57 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": false, - "release_date": "2025-01-20", - "last_updated": "2025-11-25", + "attachment": true, + "open_weights": true, + "knowledge": "2025-10", + "release_date": "2026-01-05", + "last_updated": "2026-02-04", "cost": { - "input": 0.18, - "output": 0.18 - }, - "type": "chat" + "input": 0.6, + "output": 2.5, + "reasoning": 2.5, + "cache_read": 0.06, + "cache_write": 0.75 + } }, { - "id": "deepseek-ai/DeepSeek-R1", - "name": "deepseek-ai/DeepSeek-R1", - "display_name": "deepseek-ai/DeepSeek-R1", + "id": "moonshotai/kimi-k2-instruct", + "name": "Kimi-K2-Instruct", + "display_name": "Kimi-K2-Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, + "context": 200000, "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-05-28", - "last_updated": "2025-11-25", + "knowledge": "2025-10", + "release_date": "2026-01-05", + "last_updated": "2026-02-04", "cost": { "input": 0.5, - "output": 2.18 - }, - "type": "chat" + "output": 2.4, + "cache_read": 0.05, + "cache_write": 0.625 + } }, { - "id": "Pro/deepseek-ai/DeepSeek-V3.1-Terminus", - "name": "Pro/deepseek-ai/DeepSeek-V3.1-Terminus", - "display_name": "Pro/deepseek-ai/DeepSeek-V3.1-Terminus", + "id": "MiniMaxAI/minimax-m2.1", + "name": "MiniMax-M2.1", + "display_name": "MiniMax-M2.1", "modalities": { "input": [ "text" @@ -20186,20 +19810,32 @@ ] }, "limit": { - "context": 131072, + "context": 128000, "output": 8192 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "type": "chat" + "attachment": false, + "open_weights": true, + "knowledge": "2025-10", + "release_date": "2026-02-01", + "last_updated": "2026-02-04", + "cost": { + "input": 0.3, + "output": 1.2, + "reasoning": 1.2, + "cache_read": 0.03, + "cache_write": 0.375 + } }, { - "id": "Pro/deepseek-ai/DeepSeek-V3.2-Exp", - "name": "Pro/deepseek-ai/DeepSeek-V3.2-Exp", - "display_name": "Pro/deepseek-ai/DeepSeek-V3.2-Exp", + "id": "nvidia/nemotron-nano-v2-12b", + "name": "Nemotron-Nano-V2-12b", + "display_name": "Nemotron-Nano-V2-12b", "modalities": { "input": [ "text" @@ -20209,19 +19845,30 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 32000, + "output": 4096 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "type": "chat" + "attachment": false, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2025-03-15", + "last_updated": "2026-02-04", + "cost": { + "input": 0.07, + "output": 0.2, + "cache_read": 0.007, + "cache_write": 0.08 + } }, { - "id": "Pro/deepseek-ai/DeepSeek-R1", - "name": "Pro/deepseek-ai/DeepSeek-R1", - "display_name": "Pro/deepseek-ai/DeepSeek-R1", + "id": "nvidia/llama-3_1-nemotron-ultra-253b-v1", + "name": "Llama-3.1-Nemotron-Ultra-253B-v1", + "display_name": "Llama-3.1-Nemotron-Ultra-253B-v1", "modalities": { "input": [ "text" @@ -20231,20 +19878,30 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 4096 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "type": "chat" + "attachment": false, + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2025-01-15", + "last_updated": "2026-02-04", + "cost": { + "input": 0.6, + "output": 1.8, + "cache_read": 0.06, + "cache_write": 0.75 + } }, { - "id": "Pro/deepseek-ai/DeepSeek-V3", - "name": "Pro/deepseek-ai/DeepSeek-V3", - "display_name": "Pro/deepseek-ai/DeepSeek-V3", + "id": "nvidia/nvidia-nemotron-3-nano-30b-a3b", + "name": "Nemotron-3-Nano-30B-A3B", + "display_name": "Nemotron-3-Nano-30B-A3B", "modalities": { "input": [ "text" @@ -20254,19 +19911,30 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 32000, + "output": 4096 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "type": "chat" - }, - { - "id": "inclusionAI/Ring-1T", - "name": "inclusionAI/Ring-1T", - "display_name": "inclusionAI/Ring-1T", + "attachment": false, + "open_weights": true, + "knowledge": "2025-05", + "release_date": "2025-08-10", + "last_updated": "2026-02-04", + "cost": { + "input": 0.06, + "output": 0.24, + "cache_read": 0.006, + "cache_write": 0.075 + } + }, + { + "id": "PrimeIntellect/intellect-3", + "name": "INTELLECT-3", + "display_name": "INTELLECT-3", "modalities": { "input": [ "text" @@ -20276,20 +19944,30 @@ ] }, "limit": { - "context": 131072, + "context": 128000, "output": 8192 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "type": "chat" + "attachment": false, + "open_weights": true, + "knowledge": "2025-10", + "release_date": "2026-01-25", + "last_updated": "2026-02-04", + "cost": { + "input": 0.2, + "output": 1.1, + "cache_read": 0.02, + "cache_write": 0.25 + } }, { - "id": "inclusionAI/Ling-1T", - "name": "inclusionAI/Ling-1T", - "display_name": "inclusionAI/Ling-1T", + "id": "BAAI/bge-en-icl", + "name": "BGE-ICL", + "display_name": "BGE-ICL", "modalities": { "input": [ "text" @@ -20299,19 +19977,28 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 32768, + "output": 0 }, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, - "type": "chat" + "attachment": false, + "open_weights": true, + "knowledge": "2024-06", + "release_date": "2024-07-30", + "last_updated": "2026-02-04", + "cost": { + "input": 0.01, + "output": 0 + } }, { - "id": "Pro/moonshotai/Kimi-K2-Instruct-0905", - "name": "Pro/moonshotai/Kimi-K2-Instruct-0905", - "display_name": "Pro/moonshotai/Kimi-K2-Instruct-0905", + "id": "BAAI/bge-multilingual-gemma2", + "name": "bge-multilingual-gemma2", + "display_name": "bge-multilingual-gemma2", "modalities": { "input": [ "text" @@ -20321,124 +20008,230 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 8192, + "output": 0 }, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, - "type": "chat" + "attachment": false, + "open_weights": true, + "knowledge": "2024-06", + "release_date": "2024-07-30", + "last_updated": "2026-02-04", + "cost": { + "input": 0.01, + "output": 0 + } }, { - "id": "Qwen/Qwen-Image-Edit-2509", - "name": "Qwen/Qwen-Image-Edit-2509", - "display_name": "Qwen/Qwen-Image-Edit-2509", + "id": "google/gemma-2-9b-it-fast", + "name": "Gemma-2-9b-it (Fast)", + "display_name": "Gemma-2-9b-it (Fast)", "modalities": { "input": [ - "image", "text" ], "output": [ - "image" + "text" ] }, + "limit": { + "context": 8192, + "output": 4096 + }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false + }, + "attachment": false, + "open_weights": true, + "knowledge": "2024-06", + "release_date": "2024-06-27", + "last_updated": "2026-02-04", + "cost": { + "input": 0.03, + "output": 0.09, + "cache_read": 0.003, + "cache_write": 0.0375 } }, { - "id": "Qwen/Qwen-Image-Edit", - "name": "Qwen/Qwen-Image-Edit", - "display_name": "Qwen/Qwen-Image-Edit", + "id": "google/gemma-3-27b-it-fast", + "name": "Gemma-3-27b-it (Fast)", + "display_name": "Gemma-3-27b-it (Fast)", "modalities": { "input": [ - "image", - "text" + "text", + "image" ], "output": [ - "image" + "text" ] }, - "tool_call": false, + "limit": { + "context": 128000, + "output": 8192 + }, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false + }, + "attachment": true, + "open_weights": true, + "knowledge": "2025-10", + "release_date": "2026-01-20", + "last_updated": "2026-02-04", + "cost": { + "input": 0.2, + "output": 0.6, + "cache_read": 0.02, + "cache_write": 0.25 } }, { - "id": "Qwen/Qwen-Image", - "name": "Qwen/Qwen-Image", - "display_name": "Qwen/Qwen-Image", + "id": "google/gemma-2-2b-it", + "name": "Gemma-2-2b-it", + "display_name": "Gemma-2-2b-it", "modalities": { "input": [ "text" ], "output": [ - "image" + "text" ] }, + "limit": { + "context": 8192, + "output": 4096 + }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false + }, + "attachment": false, + "open_weights": true, + "knowledge": "2024-06", + "release_date": "2024-07-31", + "last_updated": "2026-02-04", + "cost": { + "input": 0.02, + "output": 0.06, + "cache_read": 0.002, + "cache_write": 0.025 } }, { - "id": "Wan-AI/Wan2.2-I2V-A14B", - "name": "Wan-AI/Wan2.2-I2V-A14B", - "display_name": "Wan-AI/Wan2.2-I2V-A14B", + "id": "google/gemma-3-27b-it", + "name": "Gemma-3-27b-it", + "display_name": "Gemma-3-27b-it", "modalities": { "input": [ - "image", - "text" + "text", + "image" ], "output": [ - "video" + "text" ] }, - "tool_call": false, + "limit": { + "context": 128000, + "output": 8192 + }, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false + }, + "attachment": true, + "open_weights": true, + "knowledge": "2025-10", + "release_date": "2026-01-20", + "last_updated": "2026-02-04", + "cost": { + "input": 0.1, + "output": 0.3, + "cache_read": 0.01, + "cache_write": 0.125 } }, { - "id": "Wan-AI/Wan2.2-T2V-A14B", - "name": "Wan-AI/Wan2.2-T2V-A14B", - "display_name": "Wan-AI/Wan2.2-T2V-A14B", + "id": "openai/gpt-oss-20b", + "name": "gpt-oss-20b", + "display_name": "gpt-oss-20b", "modalities": { "input": [ "text" ], "output": [ - "video" + "text" ] }, - "tool_call": false, + "limit": { + "context": 128000, + "output": 4096 + }, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-09", + "release_date": "2026-01-10", + "last_updated": "2026-02-04", + "cost": { + "input": 0.05, + "output": 0.2, + "cache_read": 0.005, + "cache_write": 0.06 } }, { - "id": "TeleAI/TeleSpeechASR", - "name": "TeleAI/TeleSpeechASR", - "display_name": "TeleAI/TeleSpeechASR", + "id": "openai/gpt-oss-120b", + "name": "gpt-oss-120b", + "display_name": "gpt-oss-120b", "modalities": { "input": [ - "audio" + "text" ], "output": [ "text" ] }, - "tool_call": false, + "limit": { + "context": 128000, + "output": 8192 + }, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-09", + "release_date": "2026-01-10", + "last_updated": "2026-02-04", + "cost": { + "input": 0.15, + "output": 0.6, + "reasoning": 0.6, + "cache_read": 0.015, + "cache_write": 0.18 } }, { - "id": "Pro/THUDM/GLM-4.1V-9B-Thinking", - "name": "Pro/THUDM/GLM-4.1V-9B-Thinking", - "display_name": "Pro/THUDM/GLM-4.1V-9B-Thinking", + "id": "qwen/qwen3-235b-a22b-instruct-2507", + "name": "Qwen3 235B A22B Instruct 2507", + "display_name": "Qwen3 235B A22B Instruct 2507", "modalities": { "input": [ "text" @@ -20448,20 +20241,29 @@ ] }, "limit": { - "context": 131072, + "context": 262144, "output": 8192 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "type": "chat" + "attachment": false, + "open_weights": false, + "knowledge": "2025-07", + "release_date": "2025-07-25", + "last_updated": "2025-10-04", + "cost": { + "input": 0.2, + "output": 0.6 + } }, { - "id": "Tongyi-Zhiwen/QwenLong-L1-32B", - "name": "Tongyi-Zhiwen/QwenLong-L1-32B", - "display_name": "Tongyi-Zhiwen/QwenLong-L1-32B", + "id": "qwen/qwen3-32b-fast", + "name": "Qwen3-32B (Fast)", + "display_name": "Qwen3-32B (Fast)", "modalities": { "input": [ "text" @@ -20471,20 +20273,30 @@ ] }, "limit": { - "context": 131072, + "context": 128000, "output": 8192 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "type": "chat" + "attachment": false, + "open_weights": true, + "knowledge": "2025-12", + "release_date": "2026-01-28", + "last_updated": "2026-02-04", + "cost": { + "input": 0.2, + "output": 0.6, + "cache_read": 0.02, + "cache_write": 0.25 + } }, { - "id": "deepseek-ai/DeepSeek-R1-0528-Qwen3-8B", - "name": "deepseek-ai/DeepSeek-R1-0528-Qwen3-8B", - "display_name": "deepseek-ai/DeepSeek-R1-0528-Qwen3-8B", + "id": "qwen/qwen3-30b-a3b-thinking-2507", + "name": "Qwen3-30B-A3B-Thinking-2507", + "display_name": "Qwen3-30B-A3B-Thinking-2507", "modalities": { "input": [ "text" @@ -20494,152 +20306,228 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 16384 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "type": "chat" + "attachment": false, + "open_weights": true, + "knowledge": "2025-12", + "release_date": "2026-01-28", + "last_updated": "2026-02-04", + "cost": { + "input": 0.1, + "output": 0.3, + "reasoning": 0.3, + "cache_read": 0.01, + "cache_write": 0.125 + } }, { - "id": "Qwen/Qwen3-Reranker-8B", - "name": "Qwen/Qwen3-Reranker-8B", - "display_name": "Qwen/Qwen3-Reranker-8B", + "id": "qwen/qwen2.5-vl-72b-instruct", + "name": "Qwen2.5-VL-72B-Instruct", + "display_name": "Qwen2.5-VL-72B-Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "score" + "text" ] }, "limit": { - "context": 8192, - "output": 2048 + "context": 128000, + "output": 8192 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "type": "rerank" + "attachment": true, + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2025-01-20", + "last_updated": "2026-02-04", + "cost": { + "input": 0.25, + "output": 0.75, + "cache_read": 0.025, + "cache_write": 0.31 + } }, { - "id": "Qwen/Qwen3-Embedding-8B", - "name": "Qwen/Qwen3-Embedding-8B", - "display_name": "Qwen/Qwen3-Embedding-8B", + "id": "qwen/qwen3-30b-a3b-instruct-2507", + "name": "Qwen3-30B-A3B-Instruct-2507", + "display_name": "Qwen3-30B-A3B-Instruct-2507", "modalities": { "input": [ "text" ], "output": [ - "embedding" + "text" ] }, "limit": { - "context": 8192, - "output": 2048 + "context": 128000, + "output": 8192 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "type": "embedding" + "attachment": false, + "open_weights": true, + "knowledge": "2025-12", + "release_date": "2026-01-28", + "last_updated": "2026-02-04", + "cost": { + "input": 0.1, + "output": 0.3, + "cache_read": 0.01, + "cache_write": 0.125 + } }, { - "id": "Qwen/Qwen3-Reranker-4B", - "name": "Qwen/Qwen3-Reranker-4B", - "display_name": "Qwen/Qwen3-Reranker-4B", + "id": "qwen/qwen3-coder-30b-a3b-instruct", + "name": "Qwen3-Coder-30B-A3B-Instruct", + "display_name": "Qwen3-Coder-30B-A3B-Instruct", "modalities": { "input": [ "text" ], "output": [ - "score" + "text" ] }, "limit": { - "context": 8192, - "output": 2048 + "context": 128000, + "output": 8192 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "type": "rerank" + "attachment": false, + "open_weights": true, + "knowledge": "2025-12", + "release_date": "2026-01-28", + "last_updated": "2026-02-04", + "cost": { + "input": 0.1, + "output": 0.3, + "cache_read": 0.01, + "cache_write": 0.125 + } }, { - "id": "Qwen/Qwen3-Embedding-4B", - "name": "Qwen/Qwen3-Embedding-4B", - "display_name": "Qwen/Qwen3-Embedding-4B", + "id": "qwen/qwen3-235b-a22b-thinking-2507", + "name": "Qwen3 235B A22B Thinking 2507", + "display_name": "Qwen3 235B A22B Thinking 2507", "modalities": { "input": [ "text" ], "output": [ - "embedding" + "text" ] }, "limit": { - "context": 8192, - "output": 2048 + "context": 262144, + "output": 8192 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "embedding" + "attachment": false, + "open_weights": false, + "knowledge": "2025-07", + "release_date": "2025-07-25", + "last_updated": "2025-10-04", + "cost": { + "input": 0.2, + "output": 0.8 + } }, { - "id": "Qwen/Qwen3-Reranker-0.6B", - "name": "Qwen/Qwen3-Reranker-0.6B", - "display_name": "Qwen/Qwen3-Reranker-0.6B", + "id": "qwen/qwen2.5-coder-7b-fast", + "name": "Qwen2.5-Coder-7B (Fast)", + "display_name": "Qwen2.5-Coder-7B (Fast)", "modalities": { "input": [ "text" ], "output": [ - "score" + "text" ] }, "limit": { - "context": 8192, - "output": 2048 + "context": 128000, + "output": 8192 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "type": "rerank" + "attachment": false, + "open_weights": true, + "knowledge": "2024-09", + "release_date": "2024-09-19", + "last_updated": "2026-02-04", + "cost": { + "input": 0.03, + "output": 0.09, + "cache_read": 0.003, + "cache_write": 0.03 + } }, { - "id": "Qwen/Qwen3-Embedding-0.6B", - "name": "Qwen/Qwen3-Embedding-0.6B", - "display_name": "Qwen/Qwen3-Embedding-0.6B", + "id": "qwen/qwen3-coder-480b-a35b-instruct", + "name": "Qwen3 Coder 480B A35B Instruct", + "display_name": "Qwen3 Coder 480B A35B Instruct", "modalities": { "input": [ "text" ], "output": [ - "embedding" + "text" ] }, "limit": { - "context": 8192, - "output": 2048 + "context": 262144, + "output": 66536 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "type": "embedding" + "attachment": false, + "open_weights": false, + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2025-10-04", + "cost": { + "input": 0.4, + "output": 1.8 + } }, { - "id": "ascend-tribe/pangu-pro-moe", - "name": "ascend-tribe/pangu-pro-moe", - "display_name": "ascend-tribe/pangu-pro-moe", + "id": "qwen/qwen3-embedding-8b", + "name": "Qwen3-Embedding-8B", + "display_name": "Qwen3-Embedding-8B", "modalities": { "input": [ "text" @@ -20649,19 +20537,28 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 32768, + "output": 0 }, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, - "type": "chat" + "attachment": false, + "open_weights": true, + "knowledge": "2025-10", + "release_date": "2026-01-10", + "last_updated": "2026-02-04", + "cost": { + "input": 0.01, + "output": 0 + } }, { - "id": "Pro/Qwen/Qwen2.5-VL-7B-Instruct", - "name": "Pro/Qwen/Qwen2.5-VL-7B-Instruct", - "display_name": "Pro/Qwen/Qwen2.5-VL-7B-Instruct", + "id": "qwen/qwen3-next-80b-a3b-thinking", + "name": "Qwen3-Next-80B-A3B-Thinking", + "display_name": "Qwen3-Next-80B-A3B-Thinking", "modalities": { "input": [ "text" @@ -20671,19 +20568,32 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 16384 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" + "attachment": false, + "open_weights": true, + "knowledge": "2025-12", + "release_date": "2026-01-28", + "last_updated": "2026-02-04", + "cost": { + "input": 0.15, + "output": 1.2, + "reasoning": 1.2, + "cache_read": 0.015, + "cache_write": 0.18 + } }, { - "id": "Qwen/QVQ-72B-Preview", - "name": "Qwen/QVQ-72B-Preview", - "display_name": "Qwen/QVQ-72B-Preview", + "id": "qwen/qwen3-32b", + "name": "Qwen3-32B", + "display_name": "Qwen3-32B", "modalities": { "input": [ "text" @@ -20693,20 +20603,30 @@ ] }, "limit": { - "context": 131072, + "context": 128000, "output": 8192 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "type": "chat" + "attachment": false, + "open_weights": true, + "knowledge": "2025-12", + "release_date": "2026-01-28", + "last_updated": "2026-02-04", + "cost": { + "input": 0.1, + "output": 0.3, + "cache_read": 0.01, + "cache_write": 0.125 + } }, { - "id": "deepseek-ai/DeepSeek-V2.5", - "name": "deepseek-ai/DeepSeek-V2.5", - "display_name": "deepseek-ai/DeepSeek-V2.5", + "id": "meta-llama/meta-llama-3.1-8b-instruct-fast", + "name": "Meta-Llama-3.1-8B-Instruct (Fast)", + "display_name": "Meta-Llama-3.1-8B-Instruct (Fast)", "modalities": { "input": [ "text" @@ -20716,87 +20636,96 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 4096 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "type": "chat" + "attachment": false, + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2024-07-23", + "last_updated": "2026-02-04", + "cost": { + "input": 0.03, + "output": 0.09, + "cache_read": 0.003, + "cache_write": 0.03 + } }, { - "id": "fnlp/MOSS-TTSD-v0.5", - "name": "fnlp/MOSS-TTSD-v0.5", - "display_name": "fnlp/MOSS-TTSD-v0.5", + "id": "meta-llama/llama-3_1-405b-instruct", + "name": "Llama-3.1-405B-Instruct", + "display_name": "Llama-3.1-405B-Instruct", "modalities": { "input": [ "text" ], "output": [ - "audio" + "text" ] }, - "tool_call": false, + "limit": { + "context": 131072, + "output": 8192 + }, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false + }, + "attachment": false, + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2025-01-20", + "last_updated": "2026-02-04", + "cost": { + "input": 1, + "output": 3, + "cache_read": 0.1, + "cache_write": 1.25 } }, { - "id": "FunAudioLLM/CosyVoice2-0.5B", - "name": "FunAudioLLM/CosyVoice2-0.5B", - "display_name": "FunAudioLLM/CosyVoice2-0.5B", + "id": "meta-llama/llama-3.3-70b-instruct-fast", + "name": "Llama-3.3-70B-Instruct (Fast)", + "display_name": "Llama-3.3-70B-Instruct (Fast)", "modalities": { "input": [ "text" ], - "output": [ - "audio" - ] - }, - "tool_call": false, - "reasoning": { - "supported": false - } - }, - { - "id": "FunAudioLLM/SenseVoiceSmall", - "name": "FunAudioLLM/SenseVoiceSmall", - "display_name": "FunAudioLLM/SenseVoiceSmall", - "modalities": { - "input": [ - "audio" - ], "output": [ "text" ] }, - "tool_call": false, - "reasoning": { - "supported": false - } - }, - { - "id": "IndexTeam/IndexTTS-2", - "name": "IndexTeam/IndexTTS-2", - "display_name": "IndexTeam/IndexTTS-2", - "modalities": { - "input": [ - "text" - ], - "output": [ - "audio" - ] + "limit": { + "context": 128000, + "output": 8192 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-08", + "release_date": "2025-12-05", + "last_updated": "2026-02-04", + "cost": { + "input": 0.25, + "output": 0.75, + "cache_read": 0.025, + "cache_write": 0.31 } }, { - "id": "BAAI/bge-m3", - "name": "BAAI/bge-m3", - "display_name": "BAAI/bge-m3", + "id": "meta-llama/llama-3.3-70b-instruct-base", + "name": "Llama-3.3-70B-Instruct", + "display_name": "Llama-3.3-70B-Instruct", "modalities": { "input": [ "text" @@ -20806,101 +20735,96 @@ ] }, "limit": { - "context": 131072, + "context": 128000, "output": 8192 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "type": "embedding" + "attachment": false, + "open_weights": true, + "knowledge": "2025-08", + "release_date": "2025-12-05", + "last_updated": "2026-02-04", + "cost": { + "input": 0.13, + "output": 0.4, + "cache_read": 0.013, + "cache_write": 0.16 + } }, { - "id": "BAAI/bge-reranker-v2-m3", - "name": "BAAI/bge-reranker-v2-m3", - "display_name": "BAAI/bge-reranker-v2-m3", + "id": "meta-llama/meta-llama-3.1-8b-instruct", + "name": "Meta-Llama-3.1-8B-Instruct", + "display_name": "Meta-Llama-3.1-8B-Instruct", "modalities": { "input": [ "text" ], "output": [ - "score" - ] - }, - "limit": { - "context": 8192, - "output": 2048 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "type": "rerank" - }, - { - "id": "netease-youdao/bce-embedding-base_v1", - "name": "netease-youdao/bce-embedding-base_v1", - "display_name": "netease-youdao/bce-embedding-base_v1", - "modalities": { - "input": [ "text" - ], - "output": [ - "embedding" ] }, "limit": { - "context": 8192, - "output": 2048 + "context": 128000, + "output": 4096 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "type": "embedding" + "attachment": false, + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2024-07-23", + "last_updated": "2026-02-04", + "cost": { + "input": 0.02, + "output": 0.06, + "cache_read": 0.002, + "cache_write": 0.025 + } }, { - "id": "netease-youdao/bce-reranker-base_v1", - "name": "netease-youdao/bce-reranker-base_v1", - "display_name": "netease-youdao/bce-reranker-base_v1", + "id": "meta-llama/llama-guard-3-8b", + "name": "Llama-Guard-3-8B", + "display_name": "Llama-Guard-3-8B", "modalities": { "input": [ "text" ], "output": [ - "score" + "text" ] }, "limit": { "context": 8192, - "output": 2048 + "output": 1024 }, + "temperature": false, "tool_call": false, "reasoning": { "supported": false - } - }, - { - "id": "Kwai-Kolors/Kolors", - "name": "Kwai-Kolors/Kolors", - "display_name": "Kwai-Kolors/Kolors", - "modalities": { - "input": [ - "text" - ], - "output": [ - "image" - ] }, - "tool_call": false, - "reasoning": { - "supported": false + "attachment": false, + "open_weights": true, + "knowledge": "2024-04", + "release_date": "2024-04-18", + "last_updated": "2026-02-04", + "cost": { + "input": 0.02, + "output": 0.06, + "cache_read": 0.002, + "cache_write": 0.025 } }, { - "id": "Qwen/Qwen2-VL-72B-Instruct", - "name": "Qwen/Qwen2-VL-72B-Instruct", - "display_name": "Qwen/Qwen2-VL-72B-Instruct", + "id": "zai-org/glm-4.7", + "name": "GLM 4.7", + "display_name": "GLM 4.7", "modalities": { "input": [ "text" @@ -20913,16 +20837,26 @@ "context": 131072, "output": 8192 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" + "attachment": false, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-01-01", + "last_updated": "2025-02-04", + "cost": { + "input": 0.4, + "output": 2 + } }, { - "id": "Qwen/Qwen2.5-Coder-7B-Instruct", - "name": "Qwen/Qwen2.5-Coder-7B-Instruct", - "display_name": "Qwen/Qwen2.5-Coder-7B-Instruct", + "id": "zai-org/glm-4.5", + "name": "GLM-4.5", + "display_name": "GLM-4.5", "modalities": { "input": [ "text" @@ -20932,18 +20866,30 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 4096 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false + }, + "attachment": false, + "open_weights": false, + "knowledge": "2025-06", + "release_date": "2025-11-15", + "last_updated": "2026-02-04", + "cost": { + "input": 0.6, + "output": 2.2, + "cache_read": 0.06, + "cache_write": 0.75 } }, { - "id": "internlm/internlm2_5-7b-chat", - "name": "internlm/internlm2_5-7b-chat", - "display_name": "internlm/internlm2_5-7b-chat", + "id": "zai-org/glm-4.5-air", + "name": "GLM-4.5-Air", + "display_name": "GLM-4.5-Air", "modalities": { "input": [ "text" @@ -20953,19 +20899,30 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 4096 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "type": "chat" + "attachment": false, + "open_weights": false, + "knowledge": "2025-06", + "release_date": "2025-11-15", + "last_updated": "2026-02-04", + "cost": { + "input": 0.2, + "output": 1.2, + "cache_read": 0.02, + "cache_write": 0.25 + } }, { - "id": "Qwen/Qwen2-7B-Instruct", - "name": "Qwen/Qwen2-7B-Instruct", - "display_name": "Qwen/Qwen2-7B-Instruct", + "id": "zai-org/glm-4.7-fp8", + "name": "GLM-4.7 (FP8)", + "display_name": "GLM-4.7 (FP8)", "modalities": { "input": [ "text" @@ -20975,19 +20932,30 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 4096 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "type": "chat" + "attachment": false, + "open_weights": false, + "knowledge": "2025-12", + "release_date": "2026-01-15", + "last_updated": "2026-02-04", + "cost": { + "input": 0.4, + "output": 2, + "cache_read": 0.04, + "cache_write": 0.5 + } }, { - "id": "THUDM/glm-4-9b-chat", - "name": "THUDM/glm-4-9b-chat", - "display_name": "THUDM/glm-4-9b-chat", + "id": "deepseek-ai/deepseek-r1-0528-fast", + "name": "DeepSeek R1 0528 Fast", + "display_name": "DeepSeek R1 0528 Fast", "modalities": { "input": [ "text" @@ -21000,16 +20968,26 @@ "context": 131072, "output": 8192 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" + "attachment": false, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2025-01-01", + "last_updated": "2025-02-04", + "cost": { + "input": 2, + "output": 6 + } }, { - "id": "BAAI/bge-large-en-v1.5", - "name": "BAAI/bge-large-en-v1.5", - "display_name": "BAAI/bge-large-en-v1.5", + "id": "deepseek-ai/deepseek-r1-0528", + "name": "DeepSeek-R1-0528", + "display_name": "DeepSeek-R1-0528", "modalities": { "input": [ "text" @@ -21019,19 +20997,32 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 32768 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "embedding" + "attachment": false, + "open_weights": true, + "knowledge": "2025-11", + "release_date": "2026-01-15", + "last_updated": "2026-02-04", + "cost": { + "input": 0.8, + "output": 2.4, + "reasoning": 2.4, + "cache_read": 0.08, + "cache_write": 1 + } }, { - "id": "BAAI/bge-large-zh-v1.5", - "name": "BAAI/bge-large-zh-v1.5", - "display_name": "BAAI/bge-large-zh-v1.5", + "id": "deepseek-ai/deepseek-v3", + "name": "DeepSeek V3", + "display_name": "DeepSeek V3", "modalities": { "input": [ "text" @@ -21044,16 +21035,26 @@ "context": 131072, "output": 8192 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "embedding" + "attachment": false, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2024-05-07", + "last_updated": "2026-02-04", + "cost": { + "input": 0.5, + "output": 1.5 + } }, { - "id": "LoRA/Qwen/Qwen2.5-32B-Instruct", - "name": "LoRA/Qwen/Qwen2.5-32B-Instruct", - "display_name": "LoRA/Qwen/Qwen2.5-32B-Instruct", + "id": "deepseek-ai/deepseek-v3-0324-fast", + "name": "DeepSeek-V3-0324 (Fast)", + "display_name": "DeepSeek-V3-0324 (Fast)", "modalities": { "input": [ "text" @@ -21063,19 +21064,30 @@ ] }, "limit": { - "context": 131072, + "context": 128000, "output": 8192 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "type": "chat" + "attachment": false, + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2025-03-24", + "last_updated": "2026-02-04", + "cost": { + "input": 0.75, + "output": 2.25, + "cache_read": 0.075, + "cache_write": 0.28125 + } }, { - "id": "LoRA/Qwen/Qwen2.5-14B-Instruct", - "name": "LoRA/Qwen/Qwen2.5-14B-Instruct", - "display_name": "LoRA/Qwen/Qwen2.5-14B-Instruct", + "id": "deepseek-ai/deepseek-v3-0324", + "name": "DeepSeek-V3-0324", + "display_name": "DeepSeek-V3-0324", "modalities": { "input": [ "text" @@ -21085,19 +21097,30 @@ ] }, "limit": { - "context": 131072, + "context": 128000, "output": 8192 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "type": "chat" + "attachment": false, + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2025-03-24", + "last_updated": "2026-02-04", + "cost": { + "input": 0.5, + "output": 1.5, + "cache_read": 0.05, + "cache_write": 0.1875 + } }, { - "id": "Pro/deepseek-ai/DeepSeek-R1-Distill-Qwen-7B", - "name": "Pro/deepseek-ai/DeepSeek-R1-Distill-Qwen-7B", - "display_name": "Pro/deepseek-ai/DeepSeek-R1-Distill-Qwen-7B", + "id": "deepseek-ai/deepseek-v3.2", + "name": "DeepSeek-V3.2", + "display_name": "DeepSeek-V3.2", "modalities": { "input": [ "text" @@ -21107,62 +21130,103 @@ ] }, "limit": { - "context": 131072, + "context": 128000, "output": 8192 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "type": "chat" + "attachment": false, + "open_weights": true, + "knowledge": "2025-11", + "release_date": "2026-01-20", + "last_updated": "2026-02-04", + "cost": { + "input": 0.3, + "output": 0.45, + "reasoning": 0.45, + "cache_read": 0.03, + "cache_write": 0.375 + } }, { - "id": "deepseek-ai/DeepSeek-OCR", - "name": "deepseek-ai/DeepSeek-OCR", - "display_name": "deepseek-ai/DeepSeek-OCR", + "id": "black-forest-labs/flux-dev", + "name": "FLUX.1-dev", + "display_name": "FLUX.1-dev", "modalities": { "input": [ - "image" + "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 77, + "output": 0 }, + "temperature": false, "tool_call": false, "reasoning": { "supported": false + }, + "attachment": false, + "open_weights": true, + "knowledge": "2024-07", + "release_date": "2024-08-01", + "last_updated": "2026-02-04", + "cost": { + "input": 0, + "output": 0 } }, { - "id": "Pro/Qwen/Qwen2.5-Coder-7B-Instruct", - "name": "Pro/Qwen/Qwen2.5-Coder-7B-Instruct", - "display_name": "Pro/Qwen/Qwen2.5-Coder-7B-Instruct", + "id": "black-forest-labs/flux-schnell", + "name": "FLUX.1-schnell", + "display_name": "FLUX.1-schnell", "modalities": { "input": [ "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 77, + "output": 0 }, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false + }, + "attachment": false, + "open_weights": true, + "knowledge": "2024-07", + "release_date": "2024-08-01", + "last_updated": "2026-02-04", + "cost": { + "input": 0, + "output": 0 } - }, + } + ] + }, + "deepseek": { + "id": "deepseek", + "name": "DeepSeek", + "display_name": "DeepSeek", + "api": "https://api.deepseek.com", + "doc": "https://platform.deepseek.com/api-docs/pricing", + "models": [ { - "id": "Pro/BAAI/bge-m3", - "name": "Pro/BAAI/bge-m3", - "display_name": "Pro/BAAI/bge-m3", + "id": "deepseek-chat", + "name": "DeepSeek Chat", + "display_name": "DeepSeek Chat", "modalities": { "input": [ "text" @@ -21172,19 +21236,29 @@ ] }, "limit": { - "context": 131072, + "context": 128000, "output": 8192 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "type": "embedding" + "attachment": true, + "open_weights": false, + "knowledge": "2024-07", + "release_date": "2024-12-26", + "last_updated": "2025-08-21", + "cost": { + "input": 0.57, + "output": 1.68, + "cache_read": 0.07 + } }, { - "id": "Pro/Qwen/Qwen2.5-7B-Instruct", - "name": "Pro/Qwen/Qwen2.5-7B-Instruct", - "display_name": "Pro/Qwen/Qwen2.5-7B-Instruct", + "id": "deepseek-reasoner", + "name": "DeepSeek Reasoner", + "display_name": "DeepSeek Reasoner", "modalities": { "input": [ "text" @@ -21194,63 +21268,101 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 64000 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" - }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-07", + "release_date": "2025-01-20", + "last_updated": "2025-08-21", + "cost": { + "input": 0.57, + "output": 1.68, + "cache_read": 0.07 + } + } + ] + }, + "alibaba-cn": { + "id": "alibaba-cn", + "name": "alibaba-cn", + "display_name": "alibaba-cn", + "api": "https://dashscope.aliyuncs.com/compatible-mode/v1", + "doc": "https://www.alibabacloud.com/help/en/model-studio/models", + "models": [ { - "id": "Pro/BAAI/bge-reranker-v2-m3", - "name": "Pro/BAAI/bge-reranker-v2-m3", - "display_name": "Pro/BAAI/bge-reranker-v2-m3", + "id": "deepseek-r1-distill-qwen-7b", + "name": "DeepSeek R1 Distill Qwen 7B", + "display_name": "DeepSeek R1 Distill Qwen 7B", "modalities": { "input": [ "text" ], "output": [ - "score" + "text" ] }, "limit": { - "context": 8192, - "output": 2048 + "context": 32768, + "output": 16384 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "rerank" + "attachment": false, + "open_weights": false, + "release_date": "2025-01-01", + "last_updated": "2025-01-01", + "cost": { + "input": 0.072, + "output": 0.144 + } }, { - "id": "LoRA/Qwen/Qwen2.5-72B-Instruct", - "name": "LoRA/Qwen/Qwen2.5-72B-Instruct", - "display_name": "LoRA/Qwen/Qwen2.5-72B-Instruct", + "id": "qwen3-asr-flash", + "name": "Qwen3-ASR Flash", + "display_name": "Qwen3-ASR Flash", "modalities": { "input": [ - "text" + "audio" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 53248, + "output": 4096 }, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, - "type": "chat" + "attachment": false, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-09-08", + "last_updated": "2025-09-08", + "cost": { + "input": 0.032, + "output": 0.032 + } }, { - "id": "Pro/Qwen/Qwen2-7B-Instruct", - "name": "Pro/Qwen/Qwen2-7B-Instruct", - "display_name": "Pro/Qwen/Qwen2-7B-Instruct", + "id": "deepseek-r1-0528", + "name": "DeepSeek R1 0528", + "display_name": "DeepSeek R1 0528", "modalities": { "input": [ "text" @@ -21261,18 +21373,27 @@ }, "limit": { "context": 131072, - "output": 8192 + "output": 16384 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" + "attachment": false, + "open_weights": false, + "release_date": "2025-05-28", + "last_updated": "2025-05-28", + "cost": { + "input": 0.574, + "output": 2.294 + } }, { - "id": "LoRA/Qwen/Qwen2.5-7B-Instruct", - "name": "LoRA/Qwen/Qwen2.5-7B-Instruct", - "display_name": "LoRA/Qwen/Qwen2.5-7B-Instruct", + "id": "deepseek-v3", + "name": "DeepSeek V3", + "display_name": "DeepSeek V3", "modalities": { "input": [ "text" @@ -21282,44 +21403,68 @@ ] }, "limit": { - "context": 131072, + "context": 65536, "output": 8192 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "type": "chat" - }, - { - "id": "Pro/THUDM/glm-4-9b-chat", - "name": "Pro/THUDM/glm-4-9b-chat", - "display_name": "Pro/THUDM/glm-4-9b-chat", + "attachment": false, + "open_weights": false, + "release_date": "2024-12-01", + "last_updated": "2024-12-01", + "cost": { + "input": 0.287, + "output": 1.147 + } + }, + { + "id": "qwen-omni-turbo", + "name": "Qwen-Omni Turbo", + "display_name": "Qwen-Omni Turbo", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video" ], "output": [ - "text" + "text", + "audio" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 32768, + "output": 2048 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "type": "chat" + "attachment": false, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-01-19", + "last_updated": "2025-03-26", + "cost": { + "input": 0.058, + "output": 0.23, + "input_audio": 3.584, + "output_audio": 7.168 + } }, { - "id": "THUDM/GLM-Z1-Rumination-32B-0414", - "name": "THUDM/GLM-Z1-Rumination-32B-0414", - "display_name": "THUDM/GLM-Z1-Rumination-32B-0414", + "id": "qwen-vl-max", + "name": "Qwen-VL Max", + "display_name": "Qwen-VL Max", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -21329,187 +21474,86 @@ "context": 131072, "output": 8192 }, + "temperature": true, "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "type": "chat" - }, - { - "id": "stabilityai/stable-diffusion-xl-base-1.0", - "name": "stabilityai/stable-diffusion-xl-base-1.0", - "display_name": "stabilityai/stable-diffusion-xl-base-1.0", - "modalities": { - "input": [ - "text" - ], - "output": [ - "image" - ] - }, - "tool_call": false, "reasoning": { "supported": false - } - }, - { - "id": "black-forest-labs/FLUX.1-schnell", - "name": "black-forest-labs/FLUX.1-schnell", - "display_name": "black-forest-labs/FLUX.1-schnell", - "modalities": { - "input": [ - "text" - ], - "output": [ - "image" - ] }, - "tool_call": false, - "reasoning": { - "supported": false + "attachment": false, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2024-04-08", + "last_updated": "2025-08-13", + "cost": { + "input": 0.23, + "output": 0.574 } }, { - "id": "black-forest-labs/FLUX.1-dev", - "name": "black-forest-labs/FLUX.1-dev", - "display_name": "black-forest-labs/FLUX.1-dev", + "id": "deepseek-v3-2-exp", + "name": "DeepSeek V3.2 Exp", + "display_name": "DeepSeek V3.2 Exp", "modalities": { "input": [ "text" ], "output": [ - "image" - ] - }, - "tool_call": false, - "reasoning": { - "supported": false - } - }, - { - "id": "Pro/black-forest-labs/FLUX.1-schnell", - "name": "Pro/black-forest-labs/FLUX.1-schnell", - "display_name": "Pro/black-forest-labs/FLUX.1-schnell", - "modalities": { - "input": [ "text" - ], - "output": [ - "image" ] }, - "tool_call": false, - "reasoning": { - "supported": false - } - }, - { - "id": "stabilityai/stable-diffusion-3-5-large", - "name": "stabilityai/stable-diffusion-3-5-large", - "display_name": "stabilityai/stable-diffusion-3-5-large", - "modalities": { - "input": [ - "text" - ], - "output": [ - "image" - ] + "limit": { + "context": 131072, + "output": 65536 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false - } - }, - { - "id": "fishaudio/fish-speech-1.4", - "name": "fishaudio/fish-speech-1.4", - "display_name": "fishaudio/fish-speech-1.4", - "modalities": { - "input": [ - "text" - ], - "output": [ - "audio" - ] }, - "tool_call": false, - "reasoning": { - "supported": false + "attachment": false, + "open_weights": false, + "release_date": "2025-01-01", + "last_updated": "2025-01-01", + "cost": { + "input": 0.287, + "output": 0.431 } }, { - "id": "RVC-Boss/GPT-SoVITS", - "name": "RVC-Boss/GPT-SoVITS", - "display_name": "RVC-Boss/GPT-SoVITS", + "id": "qwen3-next-80b-a3b-instruct", + "name": "Qwen3 Next 80B A3B Instruct", + "display_name": "Qwen3 Next 80B A3B Instruct", "modalities": { "input": [ "text" ], "output": [ - "audio" - ] - }, - "tool_call": false, - "reasoning": { - "supported": false - } - }, - { - "id": "fishaudio/fish-speech-1.5", - "name": "fishaudio/fish-speech-1.5", - "display_name": "fishaudio/fish-speech-1.5", - "modalities": { - "input": [ "text" - ], - "output": [ - "audio" ] }, - "tool_call": false, - "reasoning": { - "supported": false - } - }, - { - "id": "black-forest-labs/FLUX.1-pro", - "name": "black-forest-labs/FLUX.1-pro", - "display_name": "black-forest-labs/FLUX.1-pro", - "modalities": { - "input": [ - "text" - ], - "output": [ - "image" - ] + "limit": { + "context": 131072, + "output": 32768 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false - } - }, - { - "id": "LoRA/black-forest-labs/FLUX.1-dev", - "name": "LoRA/black-forest-labs/FLUX.1-dev", - "display_name": "LoRA/black-forest-labs/FLUX.1-dev", - "modalities": { - "input": [ - "text" - ], - "output": [ - "image" - ] }, - "tool_call": false, - "reasoning": { - "supported": false + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-09", + "last_updated": "2025-09", + "cost": { + "input": 0.144, + "output": 0.574 } }, { - "id": "SeedLLM/Seed-Rice-7B", - "name": "SeedLLM/Seed-Rice-7B", - "display_name": "SeedLLM/Seed-Rice-7B", + "id": "deepseek-r1", + "name": "DeepSeek R1", + "display_name": "DeepSeek R1", "modalities": { "input": [ "text" @@ -21520,27 +21564,27 @@ }, "limit": { "context": 131072, - "output": 8192 + "output": 16384 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" - } - ] - }, - "chutes": { - "id": "chutes", - "name": "Chutes", - "display_name": "Chutes", - "api": "https://llm.chutes.ai/v1", - "doc": "https://llm.chutes.ai/v1/models", - "models": [ + "attachment": false, + "open_weights": false, + "release_date": "2025-01-01", + "last_updated": "2025-01-01", + "cost": { + "input": 0.574, + "output": 2.294 + } + }, { - "id": "NousResearch/Hermes-4.3-36B", - "name": "Hermes 4.3 36B", - "display_name": "Hermes 4.3 36B", + "id": "qwen-turbo", + "name": "Qwen Turbo", + "display_name": "Qwen Turbo", "modalities": { "input": [ "text" @@ -21550,35 +21594,45 @@ ] }, "limit": { - "context": 524288, - "output": 524288 + "context": 131072, + "output": 16384 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false, + "budget": { + "default": 38912, + "min": 0, + "max": 38912 + } + }, + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, "attachment": false, - "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2025-12-29", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2024-11-01", + "last_updated": "2025-07-15", "cost": { - "input": 0.1, - "output": 0.39, - "cache_read": 0, - "cache_write": 0, - "input_audio": 0, - "output_audio": 0 - }, - "type": "chat" + "input": 0.044, + "output": 0.087, + "reasoning": 0.431 + } }, { - "id": "NousResearch/Hermes-4-70B", - "name": "Hermes 4 70B", - "display_name": "Hermes 4 70B", + "id": "qwen3-vl-235b-a22b", + "name": "Qwen3-VL 235B-A22B", + "display_name": "Qwen3-VL 235B-A22B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -21586,7 +21640,7 @@ }, "limit": { "context": 131072, - "output": 131072 + "output": 32768 }, "temperature": true, "tool_call": true, @@ -21596,23 +21650,19 @@ }, "attachment": false, "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2025-12-29", + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "cost": { - "input": 0.11, - "output": 0.38, - "reasoning": 0.57, - "cache_read": 0, - "cache_write": 0, - "input_audio": 0, - "output_audio": 0 - }, - "type": "chat" + "input": 0.286705, + "output": 1.14682, + "reasoning": 2.867051 + } }, { - "id": "NousResearch/Hermes-4-14B", - "name": "Hermes 4 14B", - "display_name": "Hermes 4 14B", + "id": "qwen3-coder-flash", + "name": "Qwen3 Coder Flash", + "display_name": "Qwen3 Coder Flash", "modalities": { "input": [ "text" @@ -21622,37 +21672,32 @@ ] }, "limit": { - "context": 40960, - "output": 40960 + "context": 1000000, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2025-12-29", + "open_weights": false, + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 0.01, - "output": 0.05, - "reasoning": 0.075, - "cache_read": 0, - "cache_write": 0, - "input_audio": 0, - "output_audio": 0 - }, - "type": "chat" + "input": 0.144, + "output": 0.574 + } }, { - "id": "NousResearch/Hermes-4-405B-FP8-TEE", - "name": "Hermes 4 405B FP8 TEE", - "display_name": "Hermes 4 405B FP8 TEE", + "id": "qwen3-vl-30b-a3b", + "name": "Qwen3-VL 30B-A3B", + "display_name": "Qwen3-VL 30B-A3B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -21660,7 +21705,7 @@ }, "limit": { "context": 131072, - "output": 65536 + "output": 32768 }, "temperature": true, "tool_call": true, @@ -21670,19 +21715,19 @@ }, "attachment": false, "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2025-01-06", + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "cost": { - "input": 0.3, - "output": 1.2, - "reasoning": 1.8 - }, - "type": "chat" + "input": 0.108, + "output": 0.431, + "reasoning": 1.076 + } }, { - "id": "NousResearch/DeepHermes-3-Mistral-24B-Preview", - "name": "DeepHermes 3 Mistral 24B Preview", - "display_name": "DeepHermes 3 Mistral 24B Preview", + "id": "qwen3-14b", + "name": "Qwen3 14B", + "display_name": "Qwen3 14B", "modalities": { "input": [ "text" @@ -21692,32 +21737,35 @@ ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true, + "budget": { + "default": 38912, + "min": 0, + "max": 38912 + } }, "attachment": false, "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2025-12-29", + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "cost": { - "input": 0.02, - "output": 0.1, - "cache_read": 0, - "cache_write": 0, - "input_audio": 0, - "output_audio": 0 - }, - "type": "chat" + "input": 0.144, + "output": 0.574, + "reasoning": 1.434 + } }, { - "id": "rednote-hilab/dots.ocr", - "name": "dots.ocr", - "display_name": "dots.ocr", + "id": "qvq-max", + "name": "QVQ Max", + "display_name": "QVQ Max", "modalities": { "input": [ "text", @@ -21729,34 +21777,32 @@ }, "limit": { "context": 131072, - "output": 131072 + "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2025-12-29", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-03-25", + "last_updated": "2025-03-25", "cost": { - "input": 0.01, - "output": 0.01, - "cache_read": 0, - "cache_write": 0, - "input_audio": 0, - "output_audio": 0 - }, - "type": "chat" + "input": 1.147, + "output": 4.588 + } }, { - "id": "moonshotai/Kimi-K2-Instruct-0905", - "name": "Kimi K2 Instruct 0905", - "display_name": "Kimi K2 Instruct 0905", + "id": "kimi-k2.5", + "name": "Moonshot Kimi K2.5", + "display_name": "Moonshot Kimi K2.5", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -21764,31 +21810,27 @@ }, "limit": { "context": 262144, - "output": 262144 + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2025-12-29", + "release_date": "2025-01-27", + "last_updated": "2025-01-27", "cost": { - "input": 0.39, - "output": 1.9, - "cache_read": 0, - "cache_write": 0, - "input_audio": 0, - "output_audio": 0 - }, - "type": "chat" + "input": 0.574, + "output": 2.411 + } }, { - "id": "moonshotai/Kimi-K2-Thinking-TEE", - "name": "Kimi K2 Thinking TEE", - "display_name": "Kimi K2 Thinking TEE", + "id": "deepseek-r1-distill-qwen-32b", + "name": "DeepSeek R1 Distill Qwen 32B", + "display_name": "DeepSeek R1 Distill Qwen 32B", "modalities": { "input": [ "text" @@ -21798,8 +21840,8 @@ ] }, "limit": { - "context": 262144, - "output": 65535 + "context": 32768, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -21808,24 +21850,18 @@ "default": true }, "attachment": false, - "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2025-12-29", + "open_weights": false, + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.4, - "output": 1.75, - "reasoning": 2.625, - "cache_read": 0, - "cache_write": 0, - "input_audio": 0, - "output_audio": 0 - }, - "type": "chat" + "input": 0.287, + "output": 0.861 + } }, { - "id": "MiniMaxAI/MiniMax-M2.1-TEE", - "name": "MiniMax M2.1 TEE", - "display_name": "MiniMax M2.1 TEE", + "id": "qwen-plus-character", + "name": "Qwen Plus Character", + "display_name": "Qwen Plus Character", "modalities": { "input": [ "text" @@ -21835,34 +21871,28 @@ ] }, "limit": { - "context": 196608, - "output": 65536 + "context": 32768, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2025-12-29", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2024-01", + "last_updated": "2024-01", "cost": { - "input": 0.3, - "output": 1.2, - "reasoning": 1.8, - "cache_read": 0, - "cache_write": 0, - "input_audio": 0, - "output_audio": 0 - }, - "type": "chat" + "input": 0.115, + "output": 0.287 + } }, { - "id": "nvidia/NVIDIA-Nemotron-3-Nano-30B-A3B-BF16", - "name": "NVIDIA Nemotron 3 Nano 30B A3B BF16", - "display_name": "NVIDIA Nemotron 3 Nano 30B A3B BF16", + "id": "qwen2-5-14b-instruct", + "name": "Qwen2.5 14B Instruct", + "display_name": "Qwen2.5 14B Instruct", "modalities": { "input": [ "text" @@ -21872,9 +21902,9 @@ ] }, "limit": { - "context": 262144, - "output": 262144 - }, + "context": 131072, + "output": 8192 + }, "temperature": true, "tool_call": true, "reasoning": { @@ -21882,22 +21912,18 @@ }, "attachment": false, "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2025-12-29", + "knowledge": "2024-04", + "release_date": "2024-09", + "last_updated": "2024-09", "cost": { - "input": 0.06, - "output": 0.24, - "cache_read": 0, - "cache_write": 0, - "input_audio": 0, - "output_audio": 0 - }, - "type": "chat" + "input": 0.144, + "output": 0.431 + } }, { - "id": "tngtech/DeepSeek-R1T-Chimera", - "name": "DeepSeek R1T Chimera", - "display_name": "DeepSeek R1T Chimera", + "id": "qwq-plus", + "name": "QwQ Plus", + "display_name": "QwQ Plus", "modalities": { "input": [ "text" @@ -21907,34 +21933,40 @@ ] }, "limit": { - "context": 163840, - "output": 163840 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": false, "reasoning": { "supported": true, - "default": true + "default": true, + "budget": { + "default": 32768, + "min": 0, + "max": 32768 + } + }, + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, "attachment": false, - "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2025-12-29", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-03-05", + "last_updated": "2025-03-05", "cost": { - "input": 0.3, - "output": 1.2, - "reasoning": 1.8, - "cache_read": 0, - "cache_write": 0, - "input_audio": 0, - "output_audio": 0 - }, - "type": "chat" + "input": 0.23, + "output": 0.574 + } }, { - "id": "tngtech/DeepSeek-TNG-R1T2-Chimera-TEE", - "name": "DeepSeek TNG R1T2 Chimera TEE", - "display_name": "DeepSeek TNG R1T2 Chimera TEE", + "id": "qwen2-5-coder-32b-instruct", + "name": "Qwen2.5-Coder 32B Instruct", + "display_name": "Qwen2.5-Coder 32B Instruct", "modalities": { "input": [ "text" @@ -21944,30 +21976,28 @@ ] }, "limit": { - "context": 163840, - "output": 65536 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-01-06", - "last_updated": "2025-01-06", + "knowledge": "2024-04", + "release_date": "2024-11", + "last_updated": "2024-11", "cost": { - "input": 0.25, - "output": 0.85, - "reasoning": 1.275 - }, - "type": "chat" + "input": 0.287, + "output": 0.861 + } }, { - "id": "tngtech/DeepSeek-TNG-R1T2-Chimera", - "name": "DeepSeek TNG R1T2 Chimera", - "display_name": "DeepSeek TNG R1T2 Chimera", + "id": "qwen3-coder-30b-a3b-instruct", + "name": "Qwen3-Coder 30B-A3B Instruct", + "display_name": "Qwen3-Coder 30B-A3B Instruct", "modalities": { "input": [ "text" @@ -21977,34 +22007,28 @@ ] }, "limit": { - "context": 163840, - "output": 163840 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2025-12-29", + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "cost": { - "input": 0.25, - "output": 0.85, - "reasoning": 1.275, - "cache_read": 0, - "cache_write": 0, - "input_audio": 0, - "output_audio": 0 - }, - "type": "chat" + "input": 0.216, + "output": 0.861 + } }, { - "id": "tngtech/TNG-R1T-Chimera-TEE", - "name": "TNG R1T Chimera TEE", - "display_name": "TNG R1T Chimera TEE", + "id": "qwen-math-plus", + "name": "Qwen Math Plus", + "display_name": "Qwen Math Plus", "modalities": { "input": [ "text" @@ -22014,45 +22038,40 @@ ] }, "limit": { - "context": 163840, - "output": 65536 + "context": 4096, + "output": 3072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2025-12-29", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2024-08-16", + "last_updated": "2024-09-19", "cost": { - "input": 0.25, - "output": 0.85, - "reasoning": 1.275, - "cache_read": 0, - "cache_write": 0, - "input_audio": 0, - "output_audio": 0 - }, - "type": "chat" + "input": 0.574, + "output": 1.721 + } }, { - "id": "XiaomiMiMo/MiMo-V2-Flash", - "name": "MiMo V2 Flash", - "display_name": "MiMo V2 Flash", + "id": "qwen-vl-ocr", + "name": "Qwen Vl Ocr", + "display_name": "Qwen Vl Ocr", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 34096, + "output": 4096 }, "temperature": true, "tool_call": false, @@ -22060,55 +22079,50 @@ "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2025-12-29", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2024-10-28", + "last_updated": "2025-04-13", "cost": { - "input": 0.17, - "output": 0.65, - "cache_read": 0, - "cache_write": 0, - "input_audio": 0, - "output_audio": 0 - }, - "type": "chat" + "input": 0.717, + "output": 0.717 + } }, { - "id": "OpenGVLab/InternVL3-78B-TEE", - "name": "InternVL3 78B TEE", - "display_name": "InternVL3 78B TEE", + "id": "qwen-doc-turbo", + "name": "Qwen Doc Turbo", + "display_name": "Qwen Doc Turbo", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 131072, + "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-01-06", - "last_updated": "2025-01-06", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2024-01", + "last_updated": "2024-01", "cost": { - "input": 0.1, - "output": 0.39 - }, - "type": "chat" + "input": 0.087, + "output": 0.144 + } }, { - "id": "openai/gpt-oss-120b-TEE", - "name": "gpt oss 120b TEE", - "display_name": "gpt oss 120b TEE", + "id": "qwen-deep-research", + "name": "Qwen Deep Research", + "display_name": "Qwen Deep Research", "modalities": { "input": [ "text" @@ -22118,34 +22132,28 @@ ] }, "limit": { - "context": 131072, - "output": 65536 + "context": 1000000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2025-12-29", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2024-01", + "last_updated": "2024-01", "cost": { - "input": 0.04, - "output": 0.18, - "reasoning": 0.27, - "cache_read": 0, - "cache_write": 0, - "input_audio": 0, - "output_audio": 0 - }, - "type": "chat" + "input": 7.742, + "output": 23.367 + } }, { - "id": "openai/gpt-oss-20b", - "name": "gpt oss 20b", - "display_name": "gpt oss 20b", + "id": "kimi-k2-thinking", + "name": "Moonshot Kimi K2 Thinking", + "display_name": "Moonshot Kimi K2 Thinking", "modalities": { "input": [ "text" @@ -22155,8 +22163,8 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 262144, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -22166,27 +22174,20 @@ }, "attachment": false, "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2025-12-29", + "release_date": "2025-11-06", + "last_updated": "2025-11-06", "cost": { - "input": 0.02, - "output": 0.1, - "reasoning": 0.15, - "cache_read": 0, - "cache_write": 0, - "input_audio": 0, - "output_audio": 0 - }, - "type": "chat" + "input": 0.574, + "output": 2.294 + } }, { - "id": "chutesai/Mistral-Small-3.1-24B-Instruct-2503", - "name": "Mistral Small 3.1 24B Instruct 2503", - "display_name": "Mistral Small 3.1 24B Instruct 2503", + "id": "qwen2-5-72b-instruct", + "name": "Qwen2.5 72B Instruct", + "display_name": "Qwen2.5 72B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -22194,7 +22195,7 @@ }, "limit": { "context": 131072, - "output": 131072 + "output": 8192 }, "temperature": true, "tool_call": true, @@ -22203,58 +22204,56 @@ }, "attachment": false, "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2025-12-29", + "knowledge": "2024-04", + "release_date": "2024-09", + "last_updated": "2024-09", "cost": { - "input": 0.03, - "output": 0.11, - "cache_read": 0, - "cache_write": 0, - "input_audio": 0, - "output_audio": 0 - }, - "type": "chat" + "input": 0.574, + "output": 1.721 + } }, { - "id": "chutesai/Mistral-Small-3.2-24B-Instruct-2506", - "name": "Mistral Small 3.2 24B Instruct 2506", - "display_name": "Mistral Small 3.2 24B Instruct 2506", + "id": "qwen3-omni-flash", + "name": "Qwen3-Omni Flash", + "display_name": "Qwen3-Omni Flash", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video" ], "output": [ - "text" + "text", + "audio" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 65536, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2025-12-29", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-09-15", + "last_updated": "2025-09-15", "cost": { - "input": 0.06, - "output": 0.18, - "cache_read": 0, - "cache_write": 0, - "input_audio": 0, - "output_audio": 0 - }, - "type": "chat" + "input": 0.058, + "output": 0.23, + "input_audio": 3.584, + "output_audio": 7.168 + } }, { - "id": "mistralai/Devstral-2-123B-Instruct-2512", - "name": "Devstral 2 123B Instruct 2512", - "display_name": "Devstral 2 123B Instruct 2512", + "id": "qwen-flash", + "name": "Qwen Flash", + "display_name": "Qwen Flash", "modalities": { "input": [ "text" @@ -22264,32 +22263,40 @@ ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 1000000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false, + "budget": { + "default": 81920, + "min": 0, + "max": 81920 + } + }, + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, "attachment": false, - "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2025-12-29", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 0.05, - "output": 0.22, - "cache_read": 0, - "cache_write": 0, - "input_audio": 0, - "output_audio": 0 - }, - "type": "chat" + "input": 0.022, + "output": 0.216 + } }, { - "id": "unsloth/Mistral-Nemo-Instruct-2407", - "name": "Mistral Nemo Instruct 2407", - "display_name": "Mistral Nemo Instruct 2407", + "id": "qwen3-8b", + "name": "Qwen3 8B", + "display_name": "Qwen3 8B", "modalities": { "input": [ "text" @@ -22300,67 +22307,70 @@ }, "limit": { "context": 131072, - "output": 131072 + "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true, + "budget": { + "default": 38912, + "min": 0, + "max": 38912 + } }, "attachment": false, "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2025-12-29", + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "cost": { - "input": 0.02, - "output": 0.04, - "cache_read": 0, - "cache_write": 0, - "input_audio": 0, - "output_audio": 0 - }, - "type": "chat" + "input": 0.072, + "output": 0.287, + "reasoning": 0.717 + } }, { - "id": "unsloth/gemma-3-4b-it", - "name": "gemma 3 4b it", - "display_name": "gemma 3 4b it", + "id": "qwen3-omni-flash-realtime", + "name": "Qwen3-Omni Flash Realtime", + "display_name": "Qwen3-Omni Flash Realtime", "modalities": { "input": [ "text", - "image" + "image", + "audio" ], "output": [ - "text" + "text", + "audio" ] }, "limit": { - "context": 96000, - "output": 96000 + "context": 65536, + "output": 16384 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2025-12-29", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-09-15", + "last_updated": "2025-09-15", "cost": { - "input": 0.01, - "output": 0.03, - "cache_read": 0, - "cache_write": 0, - "input_audio": 0, - "output_audio": 0 - }, - "type": "chat" + "input": 0.23, + "output": 0.918, + "input_audio": 3.584, + "output_audio": 7.168 + } }, { - "id": "unsloth/Mistral-Small-24B-Instruct-2501", - "name": "Mistral Small 24B Instruct 2501", - "display_name": "Mistral Small 24B Instruct 2501", + "id": "qwen2-5-vl-72b-instruct", + "name": "Qwen2.5-VL 72B Instruct", + "display_name": "Qwen2.5-VL 72B Instruct", "modalities": { "input": [ "text", @@ -22371,8 +22381,8 @@ ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -22381,22 +22391,18 @@ }, "attachment": false, "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2025-12-29", + "knowledge": "2024-04", + "release_date": "2024-09", + "last_updated": "2024-09", "cost": { - "input": 0.03, - "output": 0.11, - "cache_read": 0, - "cache_write": 0, - "input_audio": 0, - "output_audio": 0 - }, - "type": "chat" + "input": 2.294, + "output": 6.881 + } }, { - "id": "unsloth/gemma-3-12b-it", - "name": "gemma 3 12b it", - "display_name": "gemma 3 12b it", + "id": "qwen3-vl-plus", + "name": "Qwen3 VL Plus", + "display_name": "Qwen3 VL Plus", "modalities": { "input": [ "text", @@ -22407,68 +22413,79 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 262144, + "output": 32768 }, "temperature": true, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": false, + "budget": { + "default": 81920, + "min": 0, + "max": 81920 + } }, "attachment": false, - "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2025-12-29", + "open_weights": false, + "knowledge": "2025-04", + "release_date": "2025-09-23", + "last_updated": "2025-09-23", "cost": { - "input": 0.03, - "output": 0.1, - "cache_read": 0, - "cache_write": 0, - "input_audio": 0, - "output_audio": 0 - }, - "type": "chat" + "input": 0.143353, + "output": 1.433525, + "reasoning": 4.300576 + } }, { - "id": "unsloth/gemma-3-27b-it", - "name": "gemma 3 27b it", - "display_name": "gemma 3 27b it", + "id": "qwen-plus", + "name": "Qwen Plus", + "display_name": "Qwen Plus", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 96000, - "output": 96000 + "context": 1000000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false, + "budget": { + "default": 81920, + "min": 0, + "max": 81920 + } + }, + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, "attachment": false, - "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2025-12-29", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2024-01-25", + "last_updated": "2025-09-11", "cost": { - "input": 0.04, - "output": 0.15, - "cache_read": 0, - "cache_write": 0, - "input_audio": 0, - "output_audio": 0 - }, - "type": "chat" + "input": 0.115, + "output": 0.287, + "reasoning": 1.147 + } }, { - "id": "Qwen/Qwen3-30B-A3B", - "name": "Qwen3 30B A3B", - "display_name": "Qwen3 30B A3B", + "id": "qwen2-5-32b-instruct", + "name": "Qwen2.5 32B Instruct", + "display_name": "Qwen2.5 32B Instruct", "modalities": { "input": [ "text" @@ -22478,107 +22495,101 @@ ] }, "limit": { - "context": 40960, - "output": 40960 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2025-12-29", + "knowledge": "2024-04", + "release_date": "2024-09", + "last_updated": "2024-09", "cost": { - "input": 0.06, - "output": 0.22, - "reasoning": 0.33, - "cache_read": 0, - "cache_write": 0, - "input_audio": 0, - "output_audio": 0 - }, - "type": "chat" + "input": 0.287, + "output": 0.861 + } }, { - "id": "Qwen/Qwen3-14B", - "name": "Qwen3 14B", - "display_name": "Qwen3 14B", + "id": "qwen2-5-omni-7b", + "name": "Qwen2.5-Omni 7B", + "display_name": "Qwen2.5-Omni 7B", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video" ], "output": [ - "text" + "text", + "audio" ] }, "limit": { - "context": 40960, - "output": 40960 + "context": 32768, + "output": 2048 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2025-12-29", + "knowledge": "2024-04", + "release_date": "2024-12", + "last_updated": "2024-12", "cost": { - "input": 0.05, - "output": 0.22, - "reasoning": 0.33, - "cache_read": 0, - "cache_write": 0, - "input_audio": 0, - "output_audio": 0 - }, - "type": "chat" + "input": 0.087, + "output": 0.345, + "input_audio": 5.448 + } }, { - "id": "Qwen/Qwen2.5-VL-32B-Instruct", - "name": "Qwen2.5 VL 32B Instruct", - "display_name": "Qwen2.5 VL 32B Instruct", + "id": "qwen-max", + "name": "Qwen Max", + "display_name": "Qwen Max", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 32768, + "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" + }, "attachment": false, - "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2025-12-29", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2024-04-03", + "last_updated": "2025-01-25", "cost": { - "input": 0.05, - "output": 0.22, - "cache_read": 0, - "cache_write": 0, - "input_audio": 0, - "output_audio": 0 - }, - "type": "chat" + "input": 0.345, + "output": 1.377 + } }, { - "id": "Qwen/Qwen3Guard-Gen-0.6B", - "name": "Qwen3Guard Gen 0.6B", - "display_name": "Qwen3Guard Gen 0.6B", + "id": "qwen-long", + "name": "Qwen Long", + "display_name": "Qwen Long", "modalities": { "input": [ "text" @@ -22588,8 +22599,8 @@ ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 1000000, + "output": 8192 }, "temperature": true, "tool_call": false, @@ -22597,23 +22608,19 @@ "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2025-12-29", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-01-25", + "last_updated": "2025-01-25", "cost": { - "input": 0.01, - "output": 0.01, - "cache_read": 0, - "cache_write": 0, - "input_audio": 0, - "output_audio": 0 - }, - "type": "chat" + "input": 0.072, + "output": 0.287 + } }, { - "id": "Qwen/Qwen2.5-Coder-32B-Instruct", - "name": "Qwen2.5 Coder 32B Instruct", - "display_name": "Qwen2.5 Coder 32B Instruct", + "id": "qwen2-5-math-72b-instruct", + "name": "Qwen2.5-Math 72B Instruct", + "display_name": "Qwen2.5-Math 72B Instruct", "modalities": { "input": [ "text" @@ -22623,32 +22630,28 @@ ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 4096, + "output": 3072 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2025-12-29", + "knowledge": "2024-04", + "release_date": "2024-09", + "last_updated": "2024-09", "cost": { - "input": 0.03, - "output": 0.11, - "cache_read": 0, - "cache_write": 0, - "input_audio": 0, - "output_audio": 0 - }, - "type": "chat" + "input": 0.574, + "output": 1.721 + } }, { - "id": "Qwen/Qwen2.5-72B-Instruct", - "name": "Qwen2.5 72B Instruct", - "display_name": "Qwen2.5 72B Instruct", + "id": "moonshot-kimi-k2-instruct", + "name": "Moonshot Kimi K2 Instruct", + "display_name": "Moonshot Kimi K2 Instruct", "modalities": { "input": [ "text" @@ -22658,8 +22661,8 @@ ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -22668,34 +22671,28 @@ }, "attachment": false, "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2025-12-29", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.13, - "output": 0.52, - "cache_read": 0, - "cache_write": 0, - "input_audio": 0, - "output_audio": 0 - }, - "type": "chat" + "input": 0.574, + "output": 2.294 + } }, { - "id": "Qwen/Qwen2.5-VL-72B-Instruct-TEE", - "name": "Qwen2.5 VL 72B Instruct TEE", - "display_name": "Qwen2.5 VL 72B Instruct TEE", + "id": "tongyi-intent-detect-v3", + "name": "Tongyi Intent Detect V3", + "display_name": "Tongyi Intent Detect V3", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 40960, - "output": 40960 + "context": 8192, + "output": 1024 }, "temperature": true, "tool_call": false, @@ -22703,23 +22700,19 @@ "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2025-12-29", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2024-01", + "last_updated": "2024-01", "cost": { - "input": 0.15, - "output": 0.6, - "cache_read": 0, - "cache_write": 0, - "input_audio": 0, - "output_audio": 0 - }, - "type": "chat" + "input": 0.058, + "output": 0.144 + } }, { - "id": "Qwen/Qwen3-235B-A22B", - "name": "Qwen3 235B A22B", - "display_name": "Qwen3 235B A22B", + "id": "qwen2-5-7b-instruct", + "name": "Qwen2.5 7B Instruct", + "display_name": "Qwen2.5 7B Instruct", "modalities": { "input": [ "text" @@ -22729,45 +22722,40 @@ ] }, "limit": { - "context": 40960, - "output": 40960 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2025-12-29", + "knowledge": "2024-04", + "release_date": "2024-09", + "last_updated": "2024-09", "cost": { - "input": 0.3, - "output": 1.2, - "reasoning": 1.8, - "cache_read": 0, - "cache_write": 0, - "input_audio": 0, - "output_audio": 0 - }, - "type": "chat" + "input": 0.072, + "output": 0.144 + } }, { - "id": "Qwen/Qwen3-235B-A22B-Instruct-2507-TEE", - "name": "Qwen3 235B A22B Instruct 2507 TEE", - "display_name": "Qwen3 235B A22B Instruct 2507 TEE", + "id": "qwen2-5-vl-7b-instruct", + "name": "Qwen2.5-VL 7B Instruct", + "display_name": "Qwen2.5-VL 7B Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -22776,22 +22764,18 @@ }, "attachment": false, "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2025-12-29", + "knowledge": "2024-04", + "release_date": "2024-09", + "last_updated": "2024-09", "cost": { - "input": 0.08, - "output": 0.55, - "cache_read": 0, - "cache_write": 0, - "input_audio": 0, - "output_audio": 0 - }, - "type": "chat" + "input": 0.287, + "output": 0.717 + } }, { - "id": "Qwen/Qwen3-32B", - "name": "Qwen3 32B", - "display_name": "Qwen3 32B", + "id": "deepseek-v3-1", + "name": "DeepSeek V3.1", + "display_name": "DeepSeek V3.1", "modalities": { "input": [ "text" @@ -22801,70 +22785,58 @@ ] }, "limit": { - "context": 40960, - "output": 40960 + "context": 131072, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2025-12-29", + "open_weights": false, + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.08, - "output": 0.24, - "reasoning": 0.36, - "cache_read": 0, - "cache_write": 0, - "input_audio": 0, - "output_audio": 0 - }, - "type": "chat" + "input": 0.574, + "output": 1.721 + } }, { - "id": "Qwen/Qwen3-VL-235B-A22B-Instruct", - "name": "Qwen3 VL 235B A22B Instruct", - "display_name": "Qwen3 VL 235B A22B Instruct", + "id": "deepseek-r1-distill-llama-70b", + "name": "DeepSeek R1 Distill Llama 70B", + "display_name": "DeepSeek R1 Distill Llama 70B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 32768, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2025-12-29", + "open_weights": false, + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0, - "cache_write": 0, - "input_audio": 0, - "output_audio": 0 - }, - "type": "chat" + "input": 0.287, + "output": 0.861 + } }, { - "id": "Qwen/Qwen3-30B-A3B-Instruct-2507", - "name": "Qwen3 30B A3B Instruct 2507", - "display_name": "Qwen3 30B A3B Instruct 2507", + "id": "qwen3-235b-a22b", + "name": "Qwen3 235B A22B", + "display_name": "Qwen3 235B A22B", "modalities": { "input": [ "text" @@ -22874,32 +22846,35 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false, + "budget": { + "default": 81920, + "min": 0, + "max": 81920 + } }, "attachment": false, "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2025-12-29", + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "cost": { - "input": 0.08, - "output": 0.33, - "cache_read": 0, - "cache_write": 0, - "input_audio": 0, - "output_audio": 0 - }, - "type": "chat" + "input": 0.287, + "output": 1.147, + "reasoning": 2.868 + } }, { - "id": "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8-TEE", - "name": "Qwen3 Coder 480B A35B Instruct FP8 TEE", - "display_name": "Qwen3 Coder 480B A35B Instruct FP8 TEE", + "id": "qwen2-5-coder-7b-instruct", + "name": "Qwen2.5-Coder 7B Instruct", + "display_name": "Qwen2.5-Coder 7B Instruct", "modalities": { "input": [ "text" @@ -22909,8 +22884,8 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -22919,22 +22894,18 @@ }, "attachment": false, "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2025-12-29", + "knowledge": "2024-04", + "release_date": "2024-11", + "last_updated": "2024-11", "cost": { - "input": 0.22, - "output": 0.95, - "cache_read": 0, - "cache_write": 0, - "input_audio": 0, - "output_audio": 0 - }, - "type": "chat" + "input": 0.144, + "output": 0.287 + } }, { - "id": "Qwen/Qwen3-235B-A22B-Thinking-2507", - "name": "Qwen3 235B A22B Thinking 2507", - "display_name": "Qwen3 235B A22B Thinking 2507", + "id": "deepseek-r1-distill-qwen-14b", + "name": "DeepSeek R1 Distill Qwen 14B", + "display_name": "DeepSeek R1 Distill Qwen 14B", "modalities": { "input": [ "text" @@ -22944,8 +22915,8 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 32768, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -22954,35 +22925,32 @@ "default": true }, "attachment": false, - "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2025-12-29", + "open_weights": false, + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.11, - "output": 0.6, - "reasoning": 0.9, - "cache_read": 0, - "cache_write": 0, - "input_audio": 0, - "output_audio": 0 - }, - "type": "chat" + "input": 0.144, + "output": 0.431 + } }, { - "id": "Qwen/Qwen3-Next-80B-A3B-Instruct", - "name": "Qwen3 Next 80B A3B Instruct", - "display_name": "Qwen3 Next 80B A3B Instruct", + "id": "qwen-omni-turbo-realtime", + "name": "Qwen-Omni Turbo Realtime", + "display_name": "Qwen-Omni Turbo Realtime", "modalities": { "input": [ - "text" + "text", + "image", + "audio" ], "output": [ - "text" + "text", + "audio" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 32768, + "output": 2048 }, "temperature": true, "tool_call": true, @@ -22990,23 +22958,21 @@ "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2025-12-29", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-05-08", + "last_updated": "2025-05-08", "cost": { - "input": 0.1, - "output": 0.8, - "cache_read": 0, - "cache_write": 0, - "input_audio": 0, - "output_audio": 0 - }, - "type": "chat" + "input": 0.23, + "output": 0.918, + "input_audio": 3.584, + "output_audio": 7.168 + } }, { - "id": "zai-org/GLM-4.6-TEE", - "name": "GLM 4.6 TEE", - "display_name": "GLM 4.6 TEE", + "id": "qwen-math-turbo", + "name": "Qwen Math Turbo", + "display_name": "Qwen Math Turbo", "modalities": { "input": [ "text" @@ -23016,34 +22982,28 @@ ] }, "limit": { - "context": 202752, - "output": 65536 + "context": 4096, + "output": 3072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2025-12-29", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2024-09-19", + "last_updated": "2024-09-19", "cost": { - "input": 0.35, - "output": 1.5, - "reasoning": 2.25, - "cache_read": 0, - "cache_write": 0, - "input_audio": 0, - "output_audio": 0 - }, - "type": "chat" + "input": 0.287, + "output": 0.861 + } }, { - "id": "zai-org/GLM-4.5-TEE", - "name": "GLM 4.5 TEE", - "display_name": "GLM 4.5 TEE", + "id": "qwen-mt-turbo", + "name": "Qwen Mt Turbo", + "display_name": "Qwen Mt Turbo", "modalities": { "input": [ "text" @@ -23053,46 +23013,39 @@ ] }, "limit": { - "context": 131072, - "output": 65536 + "context": 16384, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2025-12-29", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-01", + "last_updated": "2025-01", "cost": { - "input": 0.35, - "output": 1.55, - "reasoning": 2.325, - "cache_read": 0, - "cache_write": 0, - "input_audio": 0, - "output_audio": 0 - }, - "type": "chat" + "input": 0.101, + "output": 0.28 + } }, { - "id": "zai-org/GLM-4.6V", - "name": "GLM 4.6V", - "display_name": "GLM 4.6V", + "id": "deepseek-r1-distill-llama-8b", + "name": "DeepSeek R1 Distill Llama 8B", + "display_name": "DeepSeek R1 Distill Llama 8B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 65536 + "context": 32768, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -23101,24 +23054,18 @@ "default": true }, "attachment": false, - "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2025-12-29", + "open_weights": false, + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.3, - "output": 0.9, - "reasoning": 1.35, - "cache_read": 0, - "cache_write": 0, - "input_audio": 0, - "output_audio": 0 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "zai-org/GLM-4.7-TEE", - "name": "GLM 4.7 TEE", - "display_name": "GLM 4.7 TEE", + "id": "qwen3-coder-480b-a35b-instruct", + "name": "Qwen3-Coder 480B-A35B Instruct", + "display_name": "Qwen3-Coder 480B-A35B Instruct", "modalities": { "input": [ "text" @@ -23128,34 +23075,28 @@ ] }, "limit": { - "context": 202752, - "output": 65535 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2025-12-29", + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "cost": { - "input": 0.4, - "output": 1.5, - "reasoning": 2.25, - "cache_read": 0, - "cache_write": 0, - "input_audio": 0, - "output_audio": 0 - }, - "type": "chat" + "input": 0.861, + "output": 3.441 + } }, { - "id": "zai-org/GLM-4.5-Air", - "name": "GLM 4.5 Air", - "display_name": "GLM 4.5 Air", + "id": "qwen-mt-plus", + "name": "Qwen Mt Plus", + "display_name": "Qwen Mt Plus", "modalities": { "input": [ "text" @@ -23165,34 +23106,28 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 16384, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2025-12-29", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-01", + "last_updated": "2025-01", "cost": { - "input": 0.05, - "output": 0.22, - "reasoning": 0.33, - "cache_read": 0, - "cache_write": 0, - "input_audio": 0, - "output_audio": 0 - }, - "type": "chat" + "input": 0.259, + "output": 0.775 + } }, { - "id": "deepseek-ai/DeepSeek-V3-0324-TEE", - "name": "DeepSeek V3 0324 TEE", - "display_name": "DeepSeek V3 0324 TEE", + "id": "qwen3-max", + "name": "Qwen3 Max", + "display_name": "Qwen3 Max", "modalities": { "input": [ "text" @@ -23202,7 +23137,7 @@ ] }, "limit": { - "context": 163840, + "context": 262144, "output": 65536 }, "temperature": true, @@ -23211,23 +23146,19 @@ "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2025-12-29", + "open_weights": false, + "knowledge": "2025-04", + "release_date": "2025-09-23", + "last_updated": "2025-09-23", "cost": { - "input": 0.19, - "output": 0.87, - "cache_read": 0, - "cache_write": 0, - "input_audio": 0, - "output_audio": 0 - }, - "type": "chat" + "input": 0.861, + "output": 3.441 + } }, { - "id": "deepseek-ai/DeepSeek-V3.2-Speciale-TEE", - "name": "DeepSeek V3.2 Speciale TEE", - "display_name": "DeepSeek V3.2 Speciale TEE", + "id": "qwq-32b", + "name": "QwQ 32B", + "display_name": "QwQ 32B", "modalities": { "input": [ "text" @@ -23237,34 +23168,29 @@ ] }, "limit": { - "context": 163840, - "output": 65536 + "context": 131072, + "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, "attachment": false, "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2025-12-29", + "knowledge": "2024-04", + "release_date": "2024-12", + "last_updated": "2024-12", "cost": { - "input": 0.27, - "output": 0.41, - "reasoning": 0.615, - "cache_read": 0, - "cache_write": 0, - "input_audio": 0, - "output_audio": 0 - }, - "type": "chat" + "input": 0.287, + "output": 0.861 + } }, { - "id": "deepseek-ai/DeepSeek-V3.1-Terminus-TEE", - "name": "DeepSeek V3.1 Terminus TEE", - "display_name": "DeepSeek V3.1 Terminus TEE", + "id": "qwen2-5-math-7b-instruct", + "name": "Qwen2.5-Math 7B Instruct", + "display_name": "Qwen2.5-Math 7B Instruct", "modalities": { "input": [ "text" @@ -23274,34 +23200,28 @@ ] }, "limit": { - "context": 163840, - "output": 65536 + "context": 4096, + "output": 3072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2025-12-29", + "knowledge": "2024-04", + "release_date": "2024-09", + "last_updated": "2024-09", "cost": { - "input": 0.23, - "output": 0.9, - "reasoning": 1.35, - "cache_read": 0, - "cache_write": 0, - "input_audio": 0, - "output_audio": 0 - }, - "type": "chat" + "input": 0.144, + "output": 0.287 + } }, { - "id": "deepseek-ai/DeepSeek-V3", - "name": "DeepSeek V3", - "display_name": "DeepSeek V3", + "id": "qwen3-next-80b-a3b-thinking", + "name": "Qwen3 Next 80B A3B Thinking", + "display_name": "Qwen3 Next 80B A3B Thinking", "modalities": { "input": [ "text" @@ -23311,32 +23231,34 @@ ] }, "limit": { - "context": 163840, - "output": 163840 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true, + "budget": { + "default": 81920, + "min": 0, + "max": 81920 + } }, "attachment": false, "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2025-12-29", + "knowledge": "2025-04", + "release_date": "2025-09", + "last_updated": "2025-09", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0, - "cache_write": 0, - "input_audio": 0, - "output_audio": 0 - }, - "type": "chat" + "input": 0.144, + "output": 1.434 + } }, { - "id": "deepseek-ai/DeepSeek-R1-TEE", - "name": "DeepSeek R1 TEE", - "display_name": "DeepSeek R1 TEE", + "id": "deepseek-r1-distill-qwen-1-5b", + "name": "DeepSeek R1 Distill Qwen 1.5B", + "display_name": "DeepSeek R1 Distill Qwen 1.5B", "modalities": { "input": [ "text" @@ -23346,34 +23268,28 @@ ] }, "limit": { - "context": 163840, - "output": 163840 + "context": 32768, + "output": 16384 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, "attachment": false, - "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2025-12-29", + "open_weights": false, + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.3, - "output": 1.2, - "reasoning": 1.8, - "cache_read": 0, - "cache_write": 0, - "input_audio": 0, - "output_audio": 0 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "deepseek-ai/DeepSeek-R1-Distill-Llama-70B", - "name": "DeepSeek R1 Distill Llama 70B", - "display_name": "DeepSeek R1 Distill Llama 70B", + "id": "qwen3-32b", + "name": "Qwen3 32B", + "display_name": "Qwen3 32B", "modalities": { "input": [ "text" @@ -23384,70 +23300,66 @@ }, "limit": { "context": 131072, - "output": 131072 + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": true, + "budget": { + "default": 38912, + "min": 0, + "max": 38912 + } }, "attachment": false, "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2025-12-29", + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "cost": { - "input": 0.03, - "output": 0.11, - "reasoning": 0.165, - "cache_read": 0, - "cache_write": 0, - "input_audio": 0, - "output_audio": 0 - }, - "type": "chat" + "input": 0.287, + "output": 1.147, + "reasoning": 2.868 + } }, { - "id": "deepseek-ai/DeepSeek-R1-0528-TEE", - "name": "DeepSeek R1 0528 TEE", - "display_name": "DeepSeek R1 0528 TEE", + "id": "qwen-vl-plus", + "name": "Qwen-VL Plus", + "display_name": "Qwen-VL Plus", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 163840, - "output": 65536 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2025-12-29", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2024-01-25", + "last_updated": "2025-08-15", "cost": { - "input": 0.4, - "output": 1.75, - "reasoning": 2.625, - "cache_read": 0, - "cache_write": 0, - "input_audio": 0, - "output_audio": 0 - }, - "type": "chat" + "input": 0.115, + "output": 0.287 + } }, { - "id": "deepseek-ai/DeepSeek-V3.2-TEE", - "name": "DeepSeek V3.2 TEE", - "display_name": "DeepSeek V3.2 TEE", + "id": "qwen3-coder-plus", + "name": "Qwen3 Coder Plus", + "display_name": "Qwen3 Coder Plus", "modalities": { "input": [ "text" @@ -23457,34 +23369,28 @@ ] }, "limit": { - "context": 163840, + "context": 1000000, "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2025-12-29", + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", "cost": { - "input": 0.25, - "output": 0.38, - "reasoning": 0.57, - "cache_read": 0, - "cache_write": 0, - "input_audio": 0, - "output_audio": 0 - }, - "type": "chat" + "input": 1, + "output": 5 + } }, { - "id": "deepseek-ai/DeepSeek-V3.1-TEE", - "name": "DeepSeek V3.1 TEE", - "display_name": "DeepSeek V3.1 TEE", + "id": "qwen3-coder-plus-2025-09-23", + "name": "Qwen3 Coder Plus 2025 09 23", + "display_name": "Qwen3 Coder Plus 2025 09 23", "modalities": { "input": [ "text" @@ -23494,43 +23400,20 @@ ] }, "limit": { - "context": 163840, + "context": 1000000, "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "attachment": false, - "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2025-12-29", - "cost": { - "input": 0.2, - "output": 0.8, - "reasoning": 1.2, - "cache_read": 0, - "cache_write": 0, - "input_audio": 0, - "output_audio": 0 + "supported": false }, - "type": "chat" - } - ] - }, - "kimi-for-coding": { - "id": "kimi-for-coding", - "name": "Kimi For Coding", - "display_name": "Kimi For Coding", - "api": "https://api.kimi.com/coding/v1", - "doc": "https://www.kimi.com/coding/docs/en/third-party-agents.html", - "models": [ + "attachment": false + }, { - "id": "kimi-k2-thinking", - "name": "Kimi K2 Thinking", - "display_name": "Kimi K2 Thinking", + "id": "qwen3-coder-plus-2025-07-22", + "name": "Qwen3 Coder Plus 2025 07 22", + "display_name": "Qwen3 Coder Plus 2025 07 22", "modalities": { "input": [ "text" @@ -23540,41 +23423,20 @@ ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 1000000, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-07", - "release_date": "2025-11", - "last_updated": "2025-12", - "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "supported": false }, - "type": "chat" - } - ] - }, - "cortecs": { - "id": "cortecs", - "name": "Cortecs", - "display_name": "Cortecs", - "api": "https://api.cortecs.ai/v1", - "doc": "https://api.cortecs.ai/v1/models", - "models": [ + "attachment": false + }, { - "id": "nova-pro-v1", - "name": "Nova Pro 1.0", - "display_name": "Nova Pro 1.0", + "id": "qwen-vl-ocr-latest", + "name": "Qwen Vl Ocr Latest", + "display_name": "Qwen Vl Ocr Latest", "modalities": { "input": [ "text", @@ -23585,61 +23447,50 @@ ] }, "limit": { - "context": 300000, - "output": 5000 + "context": 34096, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-12-03", - "last_updated": "2024-12-03", - "cost": { - "input": 1.016, - "output": 4.061 - }, - "type": "chat" + "attachment": false }, { - "id": "devstral-2512", - "name": "Devstral 2 2512", - "display_name": "Devstral 2 2512", + "id": "qvq-max-2025-05-15", + "name": "Qvq Max 2025 05 15", + "display_name": "Qvq Max 2025 05 15", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 131072, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-12", - "release_date": "2025-12-09", - "last_updated": "2025-12-09", - "cost": { - "input": 0, - "output": 0 + "supported": true, + "default": false, + "budget": { + "default": 16384, + "min": 0, + "max": 16384 + } }, - "type": "chat" + "attachment": false }, { - "id": "intellect-3", - "name": "INTELLECT 3", - "display_name": "INTELLECT 3", + "id": "qwen-turbo-latest", + "name": "Qwen Turbo Latest", + "display_name": "Qwen Turbo Latest", "modalities": { "input": [ "text" @@ -23649,65 +23500,55 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 131072, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false, + "budget": { + "default": 38912, + "min": 0, + "max": 38912 + } }, - "attachment": true, - "open_weights": true, - "knowledge": "2025-11", - "release_date": "2025-11-26", - "last_updated": "2025-11-26", - "cost": { - "input": 0.219, - "output": 1.202 + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, - "type": "chat" + "attachment": false }, { - "id": "claude-4-5-sonnet", - "name": "Claude 4.5 Sonnet", - "display_name": "Claude 4.5 Sonnet", + "id": "qwen-turbo-2024-09-19", + "name": "Qwen Turbo 2024 09 19", + "display_name": "Qwen Turbo 2024 09 19", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 200000 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", - "cost": { - "input": 3.259, - "output": 16.296 + "supported": false }, - "type": "chat" + "attachment": false }, { - "id": "deepseek-v3-0324", - "name": "DeepSeek V3 0324", - "display_name": "DeepSeek V3 0324", + "id": "qwen-flash-2025-07-28", + "name": "Qwen Flash 2025 07 28", + "display_name": "Qwen Flash 2025 07 28", "modalities": { "input": [ "text" @@ -23717,29 +23558,32 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 1000000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false, + "budget": { + "default": 81920, + "min": 0, + "max": 81920 + } }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-03-24", - "last_updated": "2025-03-24", - "cost": { - "input": 0.551, - "output": 1.654 + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, - "type": "chat" + "attachment": false }, { - "id": "kimi-k2-thinking", - "name": "Kimi K2 Thinking", - "display_name": "Kimi K2 Thinking", + "id": "qwen-plus-latest", + "name": "Qwen Plus Latest", + "display_name": "Qwen Plus Latest", "modalities": { "input": [ "text" @@ -23749,30 +23593,32 @@ ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 1000000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false, + "budget": { + "default": 81920, + "min": 0, + "max": 81920 + } }, - "attachment": true, - "open_weights": true, - "knowledge": "2025-12", - "release_date": "2025-12-08", - "last_updated": "2025-12-08", - "cost": { - "input": 0.656, - "output": 2.731 + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, - "type": "chat" + "attachment": false }, { - "id": "kimi-k2-instruct", - "name": "Kimi K2 Instruct", - "display_name": "Kimi K2 Instruct", + "id": "qwen-plus-2024-09-19", + "name": "Qwen Plus 2024 09 19", + "display_name": "Qwen Plus 2024 09 19", "modalities": { "input": [ "text" @@ -23782,95 +23628,90 @@ ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-07-11", - "last_updated": "2025-09-05", - "cost": { - "input": 0.551, - "output": 2.646 - }, - "type": "chat" + "attachment": false }, { - "id": "gpt-4.1", - "name": "GPT 4.1", - "display_name": "GPT 4.1", + "id": "qwen-plus-2025-07-14", + "name": "Qwen Plus 2025 07 14", + "display_name": "Qwen Plus 2025 07 14", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 131072, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false, + "budget": { + "default": 38912, + "min": 0, + "max": 38912 + } }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-06", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", - "cost": { - "input": 2.354, - "output": 9.417 + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, - "type": "chat" + "attachment": false }, { - "id": "gemini-2.5-pro", - "name": "Gemini 2.5 Pro", - "display_name": "Gemini 2.5 Pro", + "id": "qwen-plus-2025-09-11", + "name": "Qwen Plus 2025 09 11", + "display_name": "Qwen Plus 2025 09 11", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65535 + "context": 1000000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false, + "budget": { + "default": 81920, + "min": 0, + "max": 81920 + } }, - "attachment": false, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-03-20", - "last_updated": "2025-06-17", - "cost": { - "input": 1.654, - "output": 11.024 + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, - "type": "chat" + "attachment": false }, { - "id": "gpt-oss-120b", - "name": "GPT Oss 120b", - "display_name": "GPT Oss 120b", + "id": "qwen-max-latest", + "name": "Qwen Max Latest", + "display_name": "Qwen Max Latest", "modalities": { "input": [ "text" @@ -23880,62 +23721,55 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-01", - "release_date": "2025-08-05", - "last_updated": "2025-08-05", - "cost": { - "input": 0, - "output": 0 + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, - "type": "chat" + "attachment": false }, { - "id": "devstral-small-2512", - "name": "Devstral Small 2 2512", - "display_name": "Devstral Small 2 2512", + "id": "qwen-max-2024-09-19", + "name": "Qwen Max 2024 09 19", + "display_name": "Qwen Max 2024 09 19", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 32768, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-12", - "release_date": "2025-12-09", - "last_updated": "2025-12-09", - "cost": { - "input": 0, - "output": 0 + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, - "type": "chat" + "attachment": false }, { - "id": "qwen3-coder-480b-a35b-instruct", - "name": "Qwen3 Coder 480B A35B Instruct", - "display_name": "Qwen3 Coder 480B A35B Instruct", + "id": "qwen-max-2024-04-28", + "name": "Qwen Max 2024 04 28", + "display_name": "Qwen Max 2024 04 28", "modalities": { "input": [ "text" @@ -23945,63 +23779,43 @@ ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 8000, + "output": 2000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2025-07-25", - "last_updated": "2025-07-25", - "cost": { - "input": 0.441, - "output": 1.984 - }, - "type": "chat" + "attachment": false }, { - "id": "claude-sonnet-4", - "name": "Claude Sonnet 4", - "display_name": "Claude Sonnet 4", + "id": "qwen-max-2024-04-03", + "name": "Qwen Max 2024 04 03", + "display_name": "Qwen Max 2024 04 03", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 8000, + "output": 2000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "knowledge": "2025-03", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", - "cost": { - "input": 3.307, - "output": 16.536 - }, - "type": "chat" + "attachment": false }, { - "id": "llama-3.1-405b-instruct", - "name": "Llama 3.1 405B Instruct", - "display_name": "Llama 3.1 405B Instruct", + "id": "qwen-max-2025-01-25", + "name": "Qwen Max 2025 01 25", + "display_name": "Qwen Max 2025 01 25", "modalities": { "input": [ "text" @@ -24011,29 +23825,26 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", - "cost": { - "input": 0, - "output": 0 + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, - "type": "chat" + "attachment": false }, { - "id": "qwen3-next-80b-a3b-thinking", - "name": "Qwen3 Next 80B A3B Thinking", - "display_name": "Qwen3 Next 80B A3B Thinking", + "id": "qwen3-max-2025-09-23", + "name": "Qwen3 Max 20250923", + "display_name": "Qwen3 Max 20250923", "modalities": { "input": [ "text" @@ -24043,30 +23854,26 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-09-11", - "last_updated": "2025-09-11", - "cost": { - "input": 0.164, - "output": 1.311 + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, - "type": "chat" + "attachment": false }, { - "id": "qwen3-32b", - "name": "Qwen3 32B", - "display_name": "Qwen3 32B", + "id": "qwen3-max-preview", + "name": "Qwen3 Max Preview", + "display_name": "Qwen3 Max Preview", "modalities": { "input": [ "text" @@ -24076,38 +23883,26 @@ ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-04-29", - "last_updated": "2025-04-29", - "cost": { - "input": 0.099, - "output": 0.33 + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, - "type": "chat" - } - ] - }, - "github-models": { - "id": "github-models", - "name": "GitHub Models", - "display_name": "GitHub Models", - "api": "https://models.github.ai/inference", - "doc": "https://docs.github.com/en/github-models", - "models": [ + "attachment": false + }, { - "id": "core42/jais-30b-chat", - "name": "JAIS 30b Chat", - "display_name": "JAIS 30b Chat", + "id": "qwen3-235b-a22b-thinking-2507", + "name": "Qwen3 235B A22B Thinking 2507", + "display_name": "Qwen3 235B A22B Thinking 2507", "modalities": { "input": [ "text" @@ -24117,30 +23912,26 @@ ] }, "limit": { - "context": 8192, - "output": 2048 + "context": 131072, + "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, - "default": true - }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-03", - "release_date": "2023-08-30", - "last_updated": "2023-08-30", - "cost": { - "input": 0, - "output": 0 + "default": true, + "budget": { + "default": 81920, + "min": 0, + "max": 81920 + } }, - "type": "chat" + "attachment": false }, { - "id": "xai/grok-3", - "name": "Grok 3", - "display_name": "Grok 3", + "id": "qwen3-235b-a22b-instruct-2507", + "name": "Qwen3 235B A22B Instruct 2507", + "display_name": "Qwen3 235B A22B Instruct 2507", "modalities": { "input": [ "text" @@ -24150,30 +23941,20 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-12-09", - "last_updated": "2024-12-09", - "cost": { - "input": 0, - "output": 0 + "supported": false }, - "type": "chat" + "attachment": false }, { - "id": "xai/grok-3-mini", - "name": "Grok 3 Mini", - "display_name": "Grok 3 Mini", + "id": "qwen3-30b-a3b-instruct-2507", + "name": "Qwen3 30B A3B Instruct 2507", + "display_name": "Qwen3 30B A3B Instruct 2507", "modalities": { "input": [ "text" @@ -24183,30 +23964,20 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-12-09", - "last_updated": "2024-12-09", - "cost": { - "input": 0, - "output": 0 + "supported": false }, - "type": "chat" + "attachment": false }, { - "id": "cohere/cohere-command-r-08-2024", - "name": "Cohere Command R 08-2024", - "display_name": "Cohere Command R 08-2024", + "id": "qwen3-30b-a3b-thinking-2507", + "name": "Qwen3 30B A3B Thinking 2507", + "display_name": "Qwen3 30B A3B Thinking 2507", "modalities": { "input": [ "text" @@ -24216,30 +23987,26 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 131072, + "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, - "default": true - }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-03", - "release_date": "2024-08-01", - "last_updated": "2024-08-01", - "cost": { - "input": 0, - "output": 0 + "default": true, + "budget": { + "default": 81920, + "min": 0, + "max": 81920 + } }, - "type": "chat" + "attachment": false }, { - "id": "cohere/cohere-command-a", - "name": "Cohere Command A", - "display_name": "Cohere Command A", + "id": "qwen3-30b-a3b", + "name": "Qwen3 30B A3B", + "display_name": "Qwen3 30B A3B", "modalities": { "input": [ "text" @@ -24249,30 +24016,26 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true - }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-03", - "release_date": "2024-11-01", - "last_updated": "2024-11-01", - "cost": { - "input": 0, - "output": 0 + "default": false, + "budget": { + "default": 81920, + "min": 0, + "max": 81920 + } }, - "type": "chat" + "attachment": false }, { - "id": "cohere/cohere-command-r-plus-08-2024", - "name": "Cohere Command R+ 08-2024", - "display_name": "Cohere Command R+ 08-2024", + "id": "qwen3-4b", + "name": "Qwen3 4B", + "display_name": "Qwen3 4B", "modalities": { "input": [ "text" @@ -24282,30 +24045,26 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true - }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-03", - "release_date": "2024-08-01", - "last_updated": "2024-08-01", - "cost": { - "input": 0, - "output": 0 + "default": true, + "budget": { + "default": 38912, + "min": 0, + "max": 38912 + } }, - "type": "chat" + "attachment": false }, { - "id": "cohere/cohere-command-r", - "name": "Cohere Command R", - "display_name": "Cohere Command R", + "id": "qwen3-1.7b", + "name": "Qwen3 1.7B", + "display_name": "Qwen3 1.7B", "modalities": { "input": [ "text" @@ -24315,30 +24074,26 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 32768, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true - }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-03", - "release_date": "2024-03-11", - "last_updated": "2024-08-01", - "cost": { - "input": 0, - "output": 0 + "default": true, + "budget": { + "default": 30720, + "min": 0, + "max": 30720 + } }, - "type": "chat" + "attachment": false }, { - "id": "cohere/cohere-command-r-plus", - "name": "Cohere Command R+", - "display_name": "Cohere Command R+", + "id": "qwen3-0.6b", + "name": "Qwen3 0.6B", + "display_name": "Qwen3 0.6B", "modalities": { "input": [ "text" @@ -24348,63 +24103,56 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 32768, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true - }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-03", - "release_date": "2024-04-04", - "last_updated": "2024-08-01", - "cost": { - "input": 0, - "output": 0 + "default": true, + "budget": { + "default": 30720, + "min": 0, + "max": 30720 + } }, - "type": "chat" + "attachment": false }, { - "id": "deepseek/deepseek-r1-0528", - "name": "DeepSeek-R1-0528", - "display_name": "DeepSeek-R1-0528", + "id": "qwen3-vl-plus-2025-09-23", + "name": "Qwen3 VL Plus 2025 09 23", + "display_name": "Qwen3 VL Plus 2025 09 23", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 65536, - "output": 8192 + "context": 262144, + "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, - "default": true - }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-06", - "release_date": "2025-05-28", - "last_updated": "2025-05-28", - "cost": { - "input": 0, - "output": 0 + "default": false, + "budget": { + "default": 81920, + "min": 0, + "max": 81920 + } }, - "type": "chat" + "attachment": false }, { - "id": "deepseek/deepseek-r1", - "name": "DeepSeek-R1", - "display_name": "DeepSeek-R1", + "id": "qwq-plus-latest", + "name": "QwQ Plus Latest", + "display_name": "QwQ Plus Latest", "modalities": { "input": [ "text" @@ -24414,30 +24162,38 @@ ] }, "limit": { - "context": 65536, + "context": 131072, "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, - "default": true + "default": true, + "budget": { + "default": 32768, + "min": 0, + "max": 32768 + } }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-06", - "release_date": "2025-01-20", - "last_updated": "2025-01-20", - "cost": { - "input": 0, - "output": 0 + "search": { + "supported": false }, - "type": "chat" - }, + "attachment": false + } + ] + }, + "novita-ai": { + "id": "novita-ai", + "name": "NovitaAI", + "display_name": "NovitaAI", + "api": "https://api.novita.ai/openai", + "doc": "https://novita.ai/docs/guides/introduction", + "models": [ { - "id": "deepseek/deepseek-v3-0324", - "name": "DeepSeek-V3-0324", - "display_name": "DeepSeek-V3-0324", + "id": "baichuan/baichuan-m2-32b", + "name": "baichuan-m2-32b", + "display_name": "baichuan-m2-32b", "modalities": { "input": [ "text" @@ -24447,42 +24203,41 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 131072, + "output": 131072 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2024-06", - "release_date": "2025-03-24", - "last_updated": "2025-03-24", + "knowledge": "2024-12", + "release_date": "2025-08-13", + "last_updated": "2025-08-13", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.07, + "output": 0.07 + } }, { - "id": "mistral-ai/mistral-medium-2505", - "name": "Mistral Medium 3 (25.05)", - "display_name": "Mistral Medium 3 (25.05)", + "id": "moonshotai/kimi-k2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -24490,21 +24245,21 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-09", - "release_date": "2025-05-01", - "last_updated": "2025-05-01", + "attachment": true, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-01-27", + "last_updated": "2026-01-27", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.6, + "output": 3, + "cache_read": 0.1 + } }, { - "id": "mistral-ai/ministral-3b", - "name": "Ministral 3B", - "display_name": "Ministral 3B", + "id": "moonshotai/kimi-k2-0905", + "name": "Kimi K2 0905", + "display_name": "Kimi K2 0905", "modalities": { "input": [ "text" @@ -24514,30 +24269,28 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2024-03", - "release_date": "2024-10-22", - "last_updated": "2024-10-22", + "knowledge": "2024-10", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.6, + "output": 2.5 + } }, { - "id": "mistral-ai/mistral-nemo", - "name": "Mistral Nemo", - "display_name": "Mistral Nemo", + "id": "moonshotai/kimi-k2-thinking", + "name": "Kimi K2 Thinking", + "display_name": "Kimi K2 Thinking", "modalities": { "input": [ "text" @@ -24547,8 +24300,8 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -24558,19 +24311,17 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-03", - "release_date": "2024-07-18", - "last_updated": "2024-07-18", + "release_date": "2025-11-07", + "last_updated": "2025-11-07", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.6, + "output": 2.5 + } }, { - "id": "mistral-ai/mistral-large-2411", - "name": "Mistral Large 24.11", - "display_name": "Mistral Large 24.11", + "id": "moonshotai/kimi-k2-instruct", + "name": "Kimi K2 Instruct", + "display_name": "Kimi K2 Instruct", "modalities": { "input": [ "text" @@ -24580,30 +24331,27 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-09", - "release_date": "2024-11-01", - "last_updated": "2024-11-01", + "open_weights": true, + "release_date": "2025-07-11", + "last_updated": "2025-07-11", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.57, + "output": 2.3 + } }, { - "id": "mistral-ai/codestral-2501", - "name": "Codestral 25.01", - "display_name": "Codestral 25.01", + "id": "nousresearch/hermes-2-pro-llama-3-8b", + "name": "Hermes 2 Pro Llama 3 8B", + "display_name": "Hermes 2 Pro Llama 3 8B", "modalities": { "input": [ "text" @@ -24613,30 +24361,27 @@ ] }, "limit": { - "context": 32000, + "context": 8192, "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-03", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "open_weights": true, + "release_date": "2024-06-27", + "last_updated": "2024-06-27", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.14, + "output": 0.14 + } }, { - "id": "mistral-ai/mistral-small-2503", - "name": "Mistral Small 3.1", - "display_name": "Mistral Small 3.1", + "id": "paddlepaddle/paddleocr-vl", + "name": "PaddleOCR-VL", + "display_name": "PaddleOCR-VL", "modalities": { "input": [ "text", @@ -24647,30 +24392,27 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 16384, + "output": 16384 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-09", - "release_date": "2025-03-01", - "last_updated": "2025-03-01", + "attachment": true, + "open_weights": true, + "release_date": "2025-10-22", + "last_updated": "2025-10-22", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.02, + "output": 0.02 + } }, { - "id": "microsoft/phi-3-medium-128k-instruct", - "name": "Phi-3-medium instruct (128k)", - "display_name": "Phi-3-medium instruct (128k)", + "id": "kwaipilot/kat-coder", + "name": "KAT-Coder-Pro V1(Free)", + "display_name": "KAT-Coder-Pro V1(Free)", "modalities": { "input": [ "text" @@ -24680,30 +24422,27 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 256000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-04-23", - "last_updated": "2024-04-23", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", "cost": { "input": 0, "output": 0 - }, - "type": "chat" + } }, { - "id": "microsoft/phi-3-mini-4k-instruct", - "name": "Phi-3-mini instruct (4k)", - "display_name": "Phi-3-mini instruct (4k)", + "id": "kwaipilot/kat-coder-pro", + "name": "Kat Coder Pro", + "display_name": "Kat Coder Pro", "modalities": { "input": [ "text" @@ -24713,30 +24452,28 @@ ] }, "limit": { - "context": 4096, - "output": 1024 + "context": 256000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-04-23", - "last_updated": "2024-04-23", + "release_date": "2026-01-05", + "last_updated": "2026-01-05", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.3, + "output": 1.2, + "cache_read": 0.06 + } }, { - "id": "microsoft/phi-3-small-128k-instruct", - "name": "Phi-3-small instruct (128k)", - "display_name": "Phi-3-small instruct (128k)", + "id": "xiaomimimo/mimo-v2-flash", + "name": "XiaomiMiMo/MiMo-V2-Flash", + "display_name": "XiaomiMiMo/MiMo-V2-Flash", "modalities": { "input": [ "text" @@ -24746,8 +24483,8 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 262144, + "output": 32000 }, "temperature": true, "tool_call": true, @@ -24757,19 +24494,19 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-04-23", - "last_updated": "2024-04-23", + "knowledge": "2024-12", + "release_date": "2025-12-19", + "last_updated": "2025-12-19", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.1, + "output": 0.3, + "cache_read": 0.3 + } }, { - "id": "microsoft/phi-3.5-vision-instruct", - "name": "Phi-3.5-vision instruct (128k)", - "display_name": "Phi-3.5-vision instruct (128k)", + "id": "deepseek/deepseek-ocr-2", + "name": "deepseek/deepseek-ocr-2", + "display_name": "deepseek/deepseek-ocr-2", "modalities": { "input": [ "text", @@ -24780,30 +24517,26 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 8192, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-08-20", - "last_updated": "2024-08-20", + "release_date": "2026-01-27", + "last_updated": "2026-01-27", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.03, + "output": 0.03 + } }, { - "id": "microsoft/phi-4", - "name": "Phi-4", - "display_name": "Phi-4", + "id": "deepseek/deepseek-prover-v2-671b", + "name": "Deepseek Prover V2 671B", + "display_name": "Deepseek Prover V2 671B", "modalities": { "input": [ "text" @@ -24813,30 +24546,27 @@ ] }, "limit": { - "context": 16000, - "output": 4096 + "context": 160000, + "output": 160000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "release_date": "2025-04-30", + "last_updated": "2025-04-30", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.7, + "output": 2.5 + } }, { - "id": "microsoft/phi-4-mini-reasoning", - "name": "Phi-4-mini-reasoning", - "display_name": "Phi-4-mini-reasoning", + "id": "deepseek/deepseek-r1-0528", + "name": "DeepSeek R1 0528", + "display_name": "DeepSeek R1 0528", "modalities": { "input": [ "text" @@ -24846,8 +24576,8 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 163840, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -24857,19 +24587,19 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "knowledge": "2024-07", + "release_date": "2025-05-28", + "last_updated": "2025-05-28", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.7, + "output": 2.5, + "cache_read": 0.35 + } }, { - "id": "microsoft/phi-3-small-8k-instruct", - "name": "Phi-3-small instruct (8k)", - "display_name": "Phi-3-small instruct (8k)", + "id": "deepseek/deepseek-r1-0528-qwen3-8b", + "name": "DeepSeek R1 0528 Qwen3 8B", + "display_name": "DeepSeek R1 0528 Qwen3 8B", "modalities": { "input": [ "text" @@ -24879,30 +24609,28 @@ ] }, "limit": { - "context": 8192, - "output": 2048 + "context": 128000, + "output": 32000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, "attachment": false, "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-04-23", - "last_updated": "2024-04-23", + "release_date": "2025-05-29", + "last_updated": "2025-05-29", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.06, + "output": 0.09 + } }, { - "id": "microsoft/phi-3.5-mini-instruct", - "name": "Phi-3.5-mini instruct (128k)", - "display_name": "Phi-3.5-mini instruct (128k)", + "id": "deepseek/deepseek-v3.1-terminus", + "name": "Deepseek V3.1 Terminus", + "display_name": "Deepseek V3.1 Terminus", "modalities": { "input": [ "text" @@ -24912,8 +24640,8 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -24923,32 +24651,29 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-08-20", - "last_updated": "2024-08-20", + "release_date": "2025-09-22", + "last_updated": "2025-09-22", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.27, + "output": 1, + "cache_read": 0.135 + } }, { - "id": "microsoft/phi-4-multimodal-instruct", - "name": "Phi-4-multimodal-instruct", - "display_name": "Phi-4-multimodal-instruct", + "id": "deepseek/deepseek-v3.1", + "name": "DeepSeek V3.1", + "display_name": "DeepSeek V3.1", "modalities": { "input": [ - "text", - "image", - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -24958,19 +24683,18 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "release_date": "2025-08-21", + "last_updated": "2025-08-21", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.27, + "output": 1, + "cache_read": 0.135 + } }, { - "id": "microsoft/phi-3-mini-128k-instruct", - "name": "Phi-3-mini instruct (128k)", - "display_name": "Phi-3-mini instruct (128k)", + "id": "deepseek/deepseek-v3-0324", + "name": "DeepSeek V3 0324", + "display_name": "DeepSeek V3 0324", "modalities": { "input": [ "text" @@ -24980,30 +24704,29 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 163840, + "output": 163840 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-04-23", - "last_updated": "2024-04-23", + "knowledge": "2024-07", + "release_date": "2025-03-25", + "last_updated": "2025-03-25", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.27, + "output": 1.12, + "cache_read": 0.135 + } }, { - "id": "microsoft/phi-3.5-moe-instruct", - "name": "Phi-3.5-MoE instruct (128k)", - "display_name": "Phi-3.5-MoE instruct (128k)", + "id": "deepseek/deepseek-r1-turbo", + "name": "DeepSeek R1 (Turbo)\t", + "display_name": "DeepSeek R1 (Turbo)\t", "modalities": { "input": [ "text" @@ -25013,8 +24736,8 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 64000, + "output": 16000 }, "temperature": true, "tool_call": true, @@ -25024,19 +24747,17 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-08-20", - "last_updated": "2024-08-20", + "release_date": "2025-03-05", + "last_updated": "2025-03-05", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.7, + "output": 2.5 + } }, { - "id": "microsoft/phi-4-mini-instruct", - "name": "Phi-4-mini-instruct", - "display_name": "Phi-4-mini-instruct", + "id": "deepseek/deepseek-v3.2-exp", + "name": "Deepseek V3.2 Exp", + "display_name": "Deepseek V3.2 Exp", "modalities": { "input": [ "text" @@ -25046,8 +24767,8 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 163840, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -25057,19 +24778,17 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.27, + "output": 0.41 + } }, { - "id": "microsoft/phi-3-medium-4k-instruct", - "name": "Phi-3-medium instruct (4k)", - "display_name": "Phi-3-medium instruct (4k)", + "id": "deepseek/deepseek-r1-distill-llama-70b", + "name": "DeepSeek R1 Distill LLama 70B", + "display_name": "DeepSeek R1 Distill LLama 70B", "modalities": { "input": [ "text" @@ -25079,63 +24798,59 @@ ] }, "limit": { - "context": 4096, - "output": 1024 + "context": 8192, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, "attachment": false, "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-04-23", - "last_updated": "2024-04-23", + "release_date": "2025-01-27", + "last_updated": "2025-01-27", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.8, + "output": 0.8 + } }, { - "id": "microsoft/phi-4-reasoning", - "name": "Phi-4-Reasoning", - "display_name": "Phi-4-Reasoning", + "id": "deepseek/deepseek-ocr", + "name": "DeepSeek-OCR", + "display_name": "DeepSeek-OCR", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 8192, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "release_date": "2025-10-24", + "last_updated": "2025-10-24", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.03, + "output": 0.03 + } }, { - "id": "microsoft/mai-ds-r1", - "name": "MAI-DS-R1", - "display_name": "MAI-DS-R1", + "id": "deepseek/deepseek-v3.2", + "name": "Deepseek V3.2", + "display_name": "Deepseek V3.2", "modalities": { "input": [ "text" @@ -25145,8 +24860,8 @@ ] }, "limit": { - "context": 65536, - "output": 8192 + "context": 163840, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -25155,86 +24870,79 @@ "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2024-06", - "release_date": "2025-01-20", - "last_updated": "2025-01-20", + "open_weights": true, + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.269, + "output": 0.4, + "cache_read": 0.1345 + } }, { - "id": "openai/gpt-4.1-nano", - "name": "GPT-4.1-nano", - "display_name": "GPT-4.1-nano", + "id": "deepseek/deepseek-v3-turbo", + "name": "DeepSeek V3 (Turbo)\t", + "display_name": "DeepSeek V3 (Turbo)\t", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 64000, + "output": 16000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "attachment": false, + "open_weights": true, + "release_date": "2025-03-05", + "last_updated": "2025-03-05", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.4, + "output": 1.3 + } }, { - "id": "openai/gpt-4.1-mini", - "name": "GPT-4.1-mini", - "display_name": "GPT-4.1-mini", + "id": "sao10k/l3-8b-lunaris", + "name": "Sao10k L3 8B Lunaris\t", + "display_name": "Sao10k L3 8B Lunaris\t", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 8192, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "attachment": false, + "open_weights": true, + "release_date": "2024-11-28", + "last_updated": "2024-11-28", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.05, + "output": 0.05 + } }, { - "id": "openai/o1-preview", - "name": "OpenAI o1-preview", - "display_name": "OpenAI o1-preview", + "id": "sao10k/L3-8B-Stheno-v3.2", + "name": "L3 8B Stheno V3.2", + "display_name": "L3 8B Stheno V3.2", "modalities": { "input": [ "text" @@ -25244,30 +24952,27 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 8192, + "output": 32000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2023-10", - "release_date": "2024-09-12", - "last_updated": "2024-09-12", + "open_weights": true, + "release_date": "2024-11-29", + "last_updated": "2024-11-29", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.05, + "output": 0.05 + } }, { - "id": "openai/o3-mini", - "name": "OpenAI o3-mini", - "display_name": "OpenAI o3-mini", + "id": "sao10k/l31-70b-euryale-v2.2", + "name": "L31 70B Euryale V2.2", + "display_name": "L31 70B Euryale V2.2", "modalities": { "input": [ "text" @@ -25277,64 +24982,57 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 8192, + "output": 8192 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-01-31", - "last_updated": "2025-01-31", + "open_weights": true, + "release_date": "2024-09-19", + "last_updated": "2024-09-19", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 1.48, + "output": 1.48 + } }, { - "id": "openai/gpt-4o", - "name": "GPT-4o", - "display_name": "GPT-4o", + "id": "sao10k/l3-70b-euryale-v2.1", + "name": "L3 70B Euryale V2.1\t", + "display_name": "L3 70B Euryale V2.1\t", "modalities": { "input": [ - "text", - "image", - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 8192, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2023-10", - "release_date": "2024-05-13", - "last_updated": "2024-05-13", + "attachment": false, + "open_weights": true, + "release_date": "2024-06-18", + "last_updated": "2024-06-18", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 1.48, + "output": 1.48 + } }, { - "id": "openai/gpt-4.1", - "name": "GPT-4.1", - "display_name": "GPT-4.1", + "id": "skywork/r1v4-lite", + "name": "Skywork R1V4-Lite", + "display_name": "Skywork R1V4-Lite", "modalities": { "input": [ "text", @@ -25345,97 +25043,90 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 262144, + "output": 65536 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "open_weights": true, + "release_date": "2025-11-18", + "last_updated": "2025-11-18", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.2, + "output": 0.6 + } }, { - "id": "openai/o4-mini", - "name": "OpenAI o4-mini", - "display_name": "OpenAI o4-mini", + "id": "minimaxai/minimax-m1-80k", + "name": "MiniMax M1", + "display_name": "MiniMax M1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 1000000, + "output": 40000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-01-31", - "last_updated": "2025-01-31", + "open_weights": true, + "release_date": "2025-06-17", + "last_updated": "2025-06-17", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.55, + "output": 2.2 + } }, { - "id": "openai/o1", - "name": "OpenAI o1", - "display_name": "OpenAI o1", + "id": "minimax/minimax-m2", + "name": "MiniMax-M2", + "display_name": "MiniMax-M2", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 204800, + "output": 131072 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2023-10", - "release_date": "2024-09-12", - "last_updated": "2024-12-17", + "open_weights": true, + "release_date": "2025-10-27", + "last_updated": "2025-10-27", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.3, + "output": 1.2, + "cache_read": 0.03 + } }, { - "id": "openai/o1-mini", - "name": "OpenAI o1-mini", - "display_name": "OpenAI o1-mini", + "id": "minimax/minimax-m2.1", + "name": "Minimax M2.1", + "display_name": "Minimax M2.1", "modalities": { "input": [ "text" @@ -25445,30 +25136,28 @@ ] }, "limit": { - "context": 128000, - "output": 65536 + "context": 204800, + "output": 131072 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2023-10", - "release_date": "2024-09-12", - "last_updated": "2024-12-17", + "open_weights": true, + "release_date": "2025-12-23", + "last_updated": "2025-12-23", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.3, + "output": 1.2, + "cache_read": 0.03 + } }, { - "id": "openai/o3", - "name": "OpenAI o3", - "display_name": "OpenAI o3", + "id": "google/gemma-3-27b-it", + "name": "Gemma 3 27B", + "display_name": "Gemma 3 27B", "modalities": { "input": [ "text", @@ -25479,109 +25168,100 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 98304, + "output": 16384 }, - "temperature": false, + "temperature": true, "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-01-31", - "last_updated": "2025-01-31", + "attachment": true, + "open_weights": true, + "release_date": "2025-03-25", + "last_updated": "2025-03-25", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.119, + "output": 0.2 + } }, { - "id": "openai/gpt-4o-mini", - "name": "GPT-4o mini", - "display_name": "GPT-4o mini", + "id": "microsoft/wizardlm-2-8x22b", + "name": "Wizardlm 2 8x22B", + "display_name": "Wizardlm 2 8x22B", "modalities": { "input": [ - "text", - "image", - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 65535, + "output": 8000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2023-10", - "release_date": "2024-07-18", - "last_updated": "2024-07-18", + "attachment": false, + "open_weights": true, + "release_date": "2024-04-24", + "last_updated": "2024-04-24", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.62, + "output": 0.62 + } }, { - "id": "meta/llama-3.2-11b-vision-instruct", - "name": "Llama-3.2-11B-Vision-Instruct", - "display_name": "Llama-3.2-11B-Vision-Instruct", + "id": "openai/gpt-oss-20b", + "name": "OpenAI: GPT OSS 20B", + "display_name": "OpenAI: GPT OSS 20B", "modalities": { "input": [ "text", - "image", - "audio" + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 131072, + "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-09-25", - "last_updated": "2024-09-25", + "release_date": "2025-08-06", + "last_updated": "2025-08-06", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.04, + "output": 0.15 + } }, { - "id": "meta/meta-llama-3.1-405b-instruct", - "name": "Meta-Llama-3.1-405B-Instruct", - "display_name": "Meta-Llama-3.1-405B-Instruct", + "id": "openai/gpt-oss-120b", + "name": "OpenAI GPT OSS 120B", + "display_name": "OpenAI GPT OSS 120B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 131072, "output": 32768 }, "temperature": true, @@ -25590,66 +25270,62 @@ "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "release_date": "2025-08-06", + "last_updated": "2025-08-06", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.05, + "output": 0.25 + } }, { - "id": "meta/llama-4-maverick-17b-128e-instruct-fp8", - "name": "Llama 4 Maverick 17B 128E Instruct FP8", - "display_name": "Llama 4 Maverick 17B 128E Instruct FP8", + "id": "gryphe/mythomax-l2-13b", + "name": "Mythomax L2 13B", + "display_name": "Mythomax L2 13B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 4096, + "output": 3200 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-01-31", - "last_updated": "2025-01-31", + "release_date": "2024-04-25", + "last_updated": "2024-04-25", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.09, + "output": 0.09 + } }, { - "id": "meta/meta-llama-3-70b-instruct", - "name": "Meta-Llama-3-70B-Instruct", - "display_name": "Meta-Llama-3-70B-Instruct", + "id": "baidu/ernie-4.5-vl-28b-a3b-thinking", + "name": "ERNIE-4.5-VL-28B-A3B-Thinking", + "display_name": "ERNIE-4.5-VL-28B-A3B-Thinking", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 2048 + "context": 131072, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -25657,21 +25333,19 @@ "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-04-18", - "last_updated": "2024-04-18", + "release_date": "2025-11-26", + "last_updated": "2025-11-26", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.39, + "output": 0.39 + } }, { - "id": "meta/meta-llama-3.1-70b-instruct", - "name": "Meta-Llama-3.1-70B-Instruct", - "display_name": "Meta-Llama-3.1-70B-Instruct", + "id": "baidu/ernie-4.5-300b-a47b-paddle", + "name": "ERNIE 4.5 300B A47B", + "display_name": "ERNIE 4.5 300B A47B", "modalities": { "input": [ "text" @@ -25681,30 +25355,27 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 123000, + "output": 12000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "release_date": "2025-06-30", + "last_updated": "2025-06-30", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.28, + "output": 1.1 + } }, { - "id": "meta/llama-3.3-70b-instruct", - "name": "Llama-3.3-70B-Instruct", - "display_name": "Llama-3.3-70B-Instruct", + "id": "baidu/ernie-4.5-21B-a3b", + "name": "ERNIE 4.5 21B A3B", + "display_name": "ERNIE 4.5 21B A3B", "modalities": { "input": [ "text" @@ -25714,98 +25385,92 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 120000, + "output": 8000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "knowledge": "2025-03", + "release_date": "2025-06-30", + "last_updated": "2025-06-30", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.07, + "output": 0.28 + } }, { - "id": "meta/llama-3.2-90b-vision-instruct", - "name": "Llama-3.2-90B-Vision-Instruct", - "display_name": "Llama-3.2-90B-Vision-Instruct", + "id": "baidu/ernie-4.5-21B-a3b-thinking", + "name": "ERNIE-4.5-21B-A3B-Thinking", + "display_name": "ERNIE-4.5-21B-A3B-Thinking", "modalities": { "input": [ - "text", - "image", - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 131072, + "output": 65536 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, "attachment": false, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-09-25", - "last_updated": "2024-09-25", + "knowledge": "2025-03", + "release_date": "2025-09-19", + "last_updated": "2025-09-19", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.07, + "output": 0.28 + } }, { - "id": "meta/meta-llama-3-8b-instruct", - "name": "Meta-Llama-3-8B-Instruct", - "display_name": "Meta-Llama-3-8B-Instruct", + "id": "baidu/ernie-4.5-vl-424b-a47b", + "name": "ERNIE 4.5 VL 424B A47B", + "display_name": "ERNIE 4.5 VL 424B A47B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 2048 + "context": 123000, + "output": 16000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-04-18", - "last_updated": "2024-04-18", + "release_date": "2025-06-30", + "last_updated": "2025-06-30", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.42, + "output": 1.25 + } }, { - "id": "meta/llama-4-scout-17b-16e-instruct", - "name": "Llama 4 Scout 17B 16E Instruct", - "display_name": "Llama 4 Scout 17B 16E Instruct", + "id": "baidu/ernie-4.5-vl-28b-a3b", + "name": "ERNIE 4.5 VL 28B A3B", + "display_name": "ERNIE 4.5 VL 28B A3B", "modalities": { "input": [ "text", @@ -25816,8 +25481,8 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 30000, + "output": 8000 }, "temperature": true, "tool_call": true, @@ -25825,54 +25490,51 @@ "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-01-31", - "last_updated": "2025-01-31", + "release_date": "2025-06-30", + "last_updated": "2025-06-30", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 1.4, + "output": 5.6 + } }, { - "id": "meta/meta-llama-3.1-8b-instruct", - "name": "Meta-Llama-3.1-8B-Instruct", - "display_name": "Meta-Llama-3.1-8B-Instruct", + "id": "qwen/qwen3-vl-30b-a3b-thinking", + "name": "qwen/qwen3-vl-30b-a3b-thinking", + "display_name": "qwen/qwen3-vl-30b-a3b-thinking", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 131072, "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "release_date": "2025-10-11", + "last_updated": "2025-10-11", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.2, + "output": 1 + } }, { - "id": "ai21-labs/ai21-jamba-1.5-large", - "name": "AI21 Jamba 1.5 Large", - "display_name": "AI21 Jamba 1.5 Large", + "id": "qwen/qwen3-235b-a22b-instruct-2507", + "name": "Qwen3 235B A22B Instruct 2507", + "display_name": "Qwen3 235B A22B Instruct 2507", "modalities": { "input": [ "text" @@ -25882,41 +25544,42 @@ ] }, "limit": { - "context": 256000, - "output": 4096 + "context": 131072, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-03", - "release_date": "2024-08-29", - "last_updated": "2024-08-29", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-22", + "last_updated": "2025-07-22", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.09, + "output": 0.58 + } }, { - "id": "ai21-labs/ai21-jamba-1.5-mini", - "name": "AI21 Jamba 1.5 Mini", - "display_name": "AI21 Jamba 1.5 Mini", + "id": "qwen/qwen3-omni-30b-a3b-thinking", + "name": "Qwen3 Omni 30B A3B Thinking", + "display_name": "Qwen3 Omni 30B A3B Thinking", "modalities": { "input": [ - "text" + "text", + "audio", + "video", + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 4096 + "context": 65536, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -25924,29 +25587,21 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-03", - "release_date": "2024-08-29", - "last_updated": "2024-08-29", + "attachment": true, + "open_weights": true, + "release_date": "2025-09-24", + "last_updated": "2025-09-24", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" - } - ] - }, - "togetherai": { - "id": "togetherai", - "name": "Together AI", - "display_name": "Together AI", - "doc": "https://docs.together.ai/docs/serverless-models", - "models": [ + "input": 0.25, + "output": 0.97, + "input_audio": 2.2, + "output_audio": 1.788 + } + }, { - "id": "moonshotai/Kimi-K2-Instruct", - "name": "Kimi K2 Instruct", - "display_name": "Kimi K2 Instruct", + "id": "qwen/qwen3-next-80b-a3b-instruct", + "name": "Qwen3 Next 80B A3B Instruct", + "display_name": "Qwen3 Next 80B A3B Instruct", "modalities": { "input": [ "text" @@ -25966,19 +25621,17 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-07-14", - "last_updated": "2025-07-14", + "release_date": "2025-09-10", + "last_updated": "2025-09-10", "cost": { - "input": 1, - "output": 3 - }, - "type": "chat" + "input": 0.15, + "output": 1.5 + } }, { - "id": "moonshotai/Kimi-K2-Thinking", - "name": "Kimi K2 Thinking", - "display_name": "Kimi K2 Thinking", + "id": "qwen/qwen3-8b-fp8", + "name": "Qwen3 8B", + "display_name": "Qwen3 8B", "modalities": { "input": [ "text" @@ -25988,33 +25641,33 @@ ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 128000, + "output": 20000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, "attachment": false, "open_weights": true, - "knowledge": "2025-07", - "release_date": "2025-11-06", - "last_updated": "2025-11-06", + "release_date": "2025-04-29", + "last_updated": "2025-04-29", "cost": { - "input": 1.2, - "output": 4 - }, - "type": "chat" + "input": 0.035, + "output": 0.138 + } }, { - "id": "essentialai/Rnj-1-Instruct", - "name": "Rnj-1 Instruct", - "display_name": "Rnj-1 Instruct", + "id": "qwen/qwen2.5-vl-72b-instruct", + "name": "Qwen2.5 VL 72B Instruct", + "display_name": "Qwen2.5 VL 72B Instruct", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" @@ -26025,25 +25678,23 @@ "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-12-05", - "last_updated": "2025-12-05", + "release_date": "2025-03-25", + "last_updated": "2025-03-25", "cost": { - "input": 0.15, - "output": 0.15 - }, - "type": "chat" + "input": 0.8, + "output": 0.8 + } }, { - "id": "openai/gpt-oss-120b", - "name": "GPT OSS 120B", - "display_name": "GPT OSS 120B", + "id": "qwen/qwen3-4b-fp8", + "name": "Qwen3 4B", + "display_name": "Qwen3 4B", "modalities": { "input": [ "text" @@ -26053,30 +25704,28 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 128000, + "output": 20000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, "attachment": false, "open_weights": true, - "knowledge": "2025-08", - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "release_date": "2025-04-29", + "last_updated": "2025-04-29", "cost": { - "input": 0.15, - "output": 0.6 - }, - "type": "chat" + "input": 0.03, + "output": 0.03 + } }, { - "id": "meta-llama/Llama-3.3-70B-Instruct-Turbo", - "name": "Llama 3.3 70B", - "display_name": "Llama 3.3 70B", + "id": "qwen/qwen3-coder-30b-a3b-instruct", + "name": "Qwen3 Coder 30b A3B Instruct", + "display_name": "Qwen3 Coder 30b A3B Instruct", "modalities": { "input": [ "text" @@ -26086,8 +25735,8 @@ ] }, "limit": { - "context": 131072, - "output": 66536 + "context": 160000, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -26096,51 +25745,49 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2025-10-09", + "last_updated": "2025-10-09", "cost": { - "input": 0.88, - "output": 0.88 - }, - "type": "chat" + "input": 0.07, + "output": 0.27 + } }, { - "id": "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8", - "name": "Qwen3 Coder 480B A35B Instruct", - "display_name": "Qwen3 Coder 480B A35B Instruct", + "id": "qwen/qwen3-vl-8b-instruct", + "name": "qwen/qwen3-vl-8b-instruct", + "display_name": "qwen/qwen3-vl-8b-instruct", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 66536 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-23", - "last_updated": "2025-07-23", + "release_date": "2025-10-17", + "last_updated": "2025-10-17", "cost": { - "input": 2, - "output": 2 - }, - "type": "chat" + "input": 0.08, + "output": 0.5 + } }, { - "id": "zai-org/GLM-4.6", - "name": "GLM 4.6", - "display_name": "GLM 4.6", + "id": "qwen/qwen3-235b-a22b-thinking-2507", + "name": "Qwen3 235B A22b Thinking 2507", + "display_name": "Qwen3 235B A22b Thinking 2507", "modalities": { "input": [ "text" @@ -26150,29 +25797,29 @@ ] }, "limit": { - "context": 200000, + "context": 131072, "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "knowledge": "2025-09", - "release_date": "2025-09-30", - "last_updated": "2025-09-30", + "knowledge": "2025-04", + "release_date": "2025-07-25", + "last_updated": "2025-07-25", "cost": { - "input": 0.6, - "output": 2.2 - }, - "type": "chat" + "input": 0.3, + "output": 3 + } }, { - "id": "deepseek-ai/DeepSeek-R1", - "name": "DeepSeek R1", - "display_name": "DeepSeek R1", + "id": "qwen/qwen2.5-7b-instruct", + "name": "Qwen2.5 7B Instruct", + "display_name": "Qwen2.5 7B Instruct", "modalities": { "input": [ "text" @@ -26182,30 +25829,27 @@ ] }, "limit": { - "context": 163839, - "output": 12288 + "context": 32000, + "output": 32000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2024-07", - "release_date": "2024-12-26", - "last_updated": "2025-03-24", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "cost": { - "input": 3, - "output": 7 - }, - "type": "chat" + "input": 0.07, + "output": 0.07 + } }, { - "id": "deepseek-ai/DeepSeek-V3", - "name": "DeepSeek V3", - "display_name": "DeepSeek V3", + "id": "qwen/qwen3-30b-a3b-fp8", + "name": "Qwen3 30B A3B", + "display_name": "Qwen3 30B A3B", "modalities": { "input": [ "text" @@ -26215,30 +25859,28 @@ ] }, "limit": { - "context": 131072, - "output": 12288 + "context": 40960, + "output": 20000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, "attachment": false, "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-01-20", - "last_updated": "2025-05-29", + "release_date": "2025-04-29", + "last_updated": "2025-04-29", "cost": { - "input": 1.25, - "output": 1.25 - }, - "type": "chat" + "input": 0.09, + "output": 0.45 + } }, { - "id": "deepseek-ai/DeepSeek-V3-1", - "name": "DeepSeek V3.1", - "display_name": "DeepSeek V3.1", + "id": "qwen/qwen3-32b-fp8", + "name": "Qwen3 32B", + "display_name": "Qwen3 32B", "modalities": { "input": [ "text" @@ -26248,50 +25890,43 @@ ] }, "limit": { - "context": 131072, - "output": 12288 + "context": 40960, + "output": 20000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, "attachment": false, "open_weights": true, - "knowledge": "2025-08", - "release_date": "2025-08-21", - "last_updated": "2025-08-21", + "release_date": "2025-04-29", + "last_updated": "2025-04-29", "cost": { - "input": 0.6, - "output": 1.7 - }, - "type": "chat" - } - ] - }, - "azure": { - "id": "azure", - "name": "Azure", - "display_name": "Azure", - "doc": "https://learn.microsoft.com/en-us/azure/ai-services/openai/concepts/models", - "models": [ + "input": 0.1, + "output": 0.45 + } + }, { - "id": "gpt-4.1-nano", - "name": "GPT-4.1 nano", - "display_name": "GPT-4.1 nano", + "id": "qwen/qwen3-omni-30b-a3b-instruct", + "name": "Qwen3 Omni 30B A3B Instruct", + "display_name": "Qwen3 Omni 30B A3B Instruct", "modalities": { "input": [ "text", + "video", + "audio", "image" ], "output": [ - "text" + "text", + "audio" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 65536, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -26299,21 +25934,21 @@ "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2024-05", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "open_weights": true, + "knowledge": "2024-04", + "release_date": "2025-09-24", + "last_updated": "2025-09-24", "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.03 - }, - "type": "chat" + "input": 0.25, + "output": 0.97, + "input_audio": 2.2, + "output_audio": 1.788 + } }, { - "id": "text-embedding-3-small", - "name": "text-embedding-3-small", - "display_name": "text-embedding-3-small", + "id": "qwen/qwen-2.5-72b-instruct", + "name": "Qwen 2.5 72B Instruct", + "display_name": "Qwen 2.5 72B Instruct", "modalities": { "input": [ "text" @@ -26323,129 +25958,122 @@ ] }, "limit": { - "context": 8191, - "output": 1536 + "context": 32000, + "output": 8192 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2024-01-25", - "last_updated": "2024-01-25", + "open_weights": true, + "knowledge": "2024-04", + "release_date": "2024-10-15", + "last_updated": "2024-10-15", "cost": { - "input": 0.02, - "output": 0 - }, - "type": "embedding" + "input": 0.38, + "output": 0.4 + } }, { - "id": "grok-4-fast-non-reasoning", - "name": "Grok 4 Fast (Non-Reasoning)", - "display_name": "Grok 4 Fast (Non-Reasoning)", + "id": "qwen/qwen3-coder-480b-a35b-instruct", + "name": "Qwen3 Coder 480B A35B Instruct", + "display_name": "Qwen3 Coder 480B A35B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-09-19", - "last_updated": "2025-09-19", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 - }, - "type": "chat" + "input": 0.3, + "output": 1.3 + } }, { - "id": "deepseek-r1-0528", - "name": "DeepSeek-R1-0528", - "display_name": "DeepSeek-R1-0528", + "id": "qwen/qwen3-vl-235b-a22b-thinking", + "name": "Qwen3 VL 235B A22B Thinking", + "display_name": "Qwen3 VL 235B A22B Thinking", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 163840, - "output": 163840 + "context": 131072, + "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-05-28", - "last_updated": "2025-05-28", + "release_date": "2025-09-24", + "last_updated": "2025-09-24", "cost": { - "input": 1.35, - "output": 5.4 - }, - "type": "chat" + "input": 0.98, + "output": 3.95 + } }, { - "id": "grok-4-fast-reasoning", - "name": "Grok 4 Fast (Reasoning)", - "display_name": "Grok 4 Fast (Reasoning)", + "id": "qwen/qwen-mt-plus", + "name": "Qwen MT Plus", + "display_name": "Qwen MT Plus", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 16384, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-09-19", - "last_updated": "2025-09-19", + "attachment": false, + "open_weights": true, + "release_date": "2025-09-03", + "last_updated": "2025-09-03", "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 - }, - "type": "chat" + "input": 0.25, + "output": 0.75 + } }, { - "id": "phi-3-medium-128k-instruct", - "name": "Phi-3-medium-instruct (128k)", - "display_name": "Phi-3-medium-instruct (128k)", + "id": "qwen/qwen3-max", + "name": "Qwen3 Max", + "display_name": "Qwen3 Max", "modalities": { "input": [ "text" @@ -26455,198 +26083,184 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 262144, + "output": 65536 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-04-23", - "last_updated": "2024-04-23", - "cost": { - "input": 0.17, - "output": 0.68 - }, - "type": "chat" + "open_weights": false, + "knowledge": "2025-04", + "release_date": "2025-09-24", + "last_updated": "2025-09-24", + "cost": { + "input": 2.11, + "output": 8.45 + } }, { - "id": "gpt-4", - "name": "GPT-4", - "display_name": "GPT-4", + "id": "qwen/qwen3-vl-235b-a22b-instruct", + "name": "Qwen3 VL 235B A22B Instruct", + "display_name": "Qwen3 VL 235B A22B Instruct", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "knowledge": "2023-11", - "release_date": "2023-03-14", - "last_updated": "2023-03-14", + "attachment": true, + "open_weights": true, + "release_date": "2025-09-24", + "last_updated": "2025-09-24", "cost": { - "input": 60, - "output": 120 - }, - "type": "chat" + "input": 0.3, + "output": 1.5 + } }, { - "id": "claude-opus-4-1", - "name": "Claude Opus 4.1", - "display_name": "Claude Opus 4.1", + "id": "qwen/qwen3-vl-30b-a3b-instruct", + "name": "qwen/qwen3-vl-30b-a3b-instruct", + "display_name": "qwen/qwen3-vl-30b-a3b-instruct", "modalities": { "input": [ "text", - "image", - "pdf" + "video", + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-11-18", - "last_updated": "2025-11-18", + "open_weights": true, + "release_date": "2025-10-11", + "last_updated": "2025-10-11", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 - }, - "type": "chat" + "input": 0.2, + "output": 0.7 + } }, { - "id": "gpt-5.2-chat", - "name": "GPT-5.2 Chat", - "display_name": "GPT-5.2 Chat", + "id": "qwen/qwen3-coder-next", + "name": "Qwen3 Coder Next", + "display_name": "Qwen3 Coder Next", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 262144, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "attachment": false, + "open_weights": true, + "release_date": "2026-02-03", + "last_updated": "2026-02-03", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 - }, - "type": "chat" + "input": 0.2, + "output": 1.5 + } }, { - "id": "llama-3.2-11b-vision-instruct", - "name": "Llama-3.2-11B-Vision-Instruct", - "display_name": "Llama-3.2-11B-Vision-Instruct", + "id": "qwen/qwen3-next-80b-a3b-thinking", + "name": "Qwen3 Next 80B A3B Thinking", + "display_name": "Qwen3 Next 80B A3B Thinking", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-09-25", - "last_updated": "2024-09-25", + "release_date": "2025-09-10", + "last_updated": "2025-09-10", "cost": { - "input": 0.37, - "output": 0.37 - }, - "type": "chat" + "input": 0.15, + "output": 1.5 + } }, { - "id": "cohere-embed-v-4-0", - "name": "Embed v4", - "display_name": "Embed v4", + "id": "qwen/qwen3-235b-a22b-fp8", + "name": "Qwen3 235B A22B", + "display_name": "Qwen3 235B A22B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 1536 + "context": 40960, + "output": 20000 }, - "temperature": false, + "temperature": true, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2025-04-15", - "last_updated": "2025-04-15", + "release_date": "2025-04-29", + "last_updated": "2025-04-29", "cost": { - "input": 0.12, - "output": 0 - }, - "type": "chat" + "input": 0.2, + "output": 0.8 + } }, { - "id": "cohere-command-r-08-2024", - "name": "Command R", - "display_name": "Command R", + "id": "mistralai/mistral-nemo", + "name": "Mistral Nemo", + "display_name": "Mistral Nemo", "modalities": { "input": [ "text" @@ -26656,30 +26270,27 @@ ] }, "limit": { - "context": 128000, - "output": 4000 + "context": 60288, + "output": 16000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2024-06-01", - "release_date": "2024-08-30", - "last_updated": "2024-08-30", + "release_date": "2024-07-30", + "last_updated": "2024-07-30", "cost": { - "input": 0.15, - "output": 0.6 - }, - "type": "chat" + "input": 0.04, + "output": 0.17 + } }, { - "id": "grok-4", - "name": "Grok 4", - "display_name": "Grok 4", + "id": "meta-llama/llama-3-70b-instruct", + "name": "Llama3 70B Instruct", + "display_name": "Llama3 70B Instruct", "modalities": { "input": [ "text" @@ -26689,32 +26300,27 @@ ] }, "limit": { - "context": 256000, - "output": 64000 + "context": 8192, + "output": 8000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-07-09", - "last_updated": "2025-07-09", + "open_weights": true, + "release_date": "2024-04-25", + "last_updated": "2024-04-25", "cost": { - "input": 3, - "output": 15, - "reasoning": 15, - "cache_read": 0.75 - }, - "type": "chat" + "input": 0.51, + "output": 0.74 + } }, { - "id": "cohere-embed-v3-multilingual", - "name": "Embed v3 Multilingual", - "display_name": "Embed v3 Multilingual", + "id": "meta-llama/llama-3-8b-instruct", + "name": "Llama 3 8B Instruct", + "display_name": "Llama 3 8B Instruct", "modalities": { "input": [ "text" @@ -26724,28 +26330,27 @@ ] }, "limit": { - "context": 512, - "output": 1024 + "context": 8192, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2023-11-07", - "last_updated": "2023-11-07", + "release_date": "2024-04-25", + "last_updated": "2024-04-25", "cost": { - "input": 0.1, - "output": 0 - }, - "type": "chat" + "input": 0.04, + "output": 0.04 + } }, { - "id": "phi-4-mini", - "name": "Phi-4-mini", - "display_name": "Phi-4-mini", + "id": "meta-llama/llama-3.1-8b-instruct", + "name": "Llama 3.1 8B Instruct", + "display_name": "Llama 3.1 8B Instruct", "modalities": { "input": [ "text" @@ -26755,61 +26360,58 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 16384, + "output": 16384 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "release_date": "2024-07-24", + "last_updated": "2024-07-24", "cost": { - "input": 0.075, - "output": 0.3 - }, - "type": "chat" + "input": 0.02, + "output": 0.05 + } }, { - "id": "gpt-4-32k", - "name": "GPT-4 32K", - "display_name": "GPT-4 32K", + "id": "meta-llama/llama-4-maverick-17b-128e-instruct-fp8", + "name": "Llama 4 Maverick Instruct", + "display_name": "Llama 4 Maverick Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 1048576, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "knowledge": "2023-11", - "release_date": "2023-03-14", - "last_updated": "2023-03-14", + "attachment": true, + "open_weights": true, + "release_date": "2025-04-06", + "last_updated": "2025-04-06", "cost": { - "input": 60, - "output": 120 - }, - "type": "chat" + "input": 0.27, + "output": 0.85 + } }, { - "id": "meta-llama-3.1-405b-instruct", - "name": "Meta-Llama-3.1-405B-Instruct", - "display_name": "Meta-Llama-3.1-405B-Instruct", + "id": "meta-llama/llama-3.3-70b-instruct", + "name": "Llama 3.3 70B Instruct", + "display_name": "Llama 3.3 70B Instruct", "modalities": { "input": [ "text" @@ -26819,8 +26421,8 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 131072, + "output": 120000 }, "temperature": true, "tool_call": true, @@ -26830,18 +26432,48 @@ "attachment": false, "open_weights": true, "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "release_date": "2024-12-07", + "last_updated": "2024-12-07", "cost": { - "input": 5.33, - "output": 16 + "input": 0.135, + "output": 0.4 + } + }, + { + "id": "meta-llama/llama-4-scout-17b-16e-instruct", + "name": "Llama 4 Scout Instruct", + "display_name": "Llama 4 Scout Instruct", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] }, - "type": "chat" + "limit": { + "context": 131072, + "output": 131072 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": true, + "release_date": "2025-04-06", + "last_updated": "2025-04-06", + "cost": { + "input": 0.18, + "output": 0.59 + } }, { - "id": "deepseek-r1", - "name": "DeepSeek-R1", - "display_name": "DeepSeek-R1", + "id": "zai-org/glm-4.7", + "name": "GLM-4.7", + "display_name": "GLM-4.7", "modalities": { "input": [ "text" @@ -26851,30 +26483,29 @@ ] }, "limit": { - "context": 163840, - "output": 163840 + "context": 204800, + "output": 131072 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, "attachment": false, "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-01-20", - "last_updated": "2025-01-20", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "cost": { - "input": 1.35, - "output": 5.4 - }, - "type": "chat" + "input": 0.6, + "output": 2.2, + "cache_read": 0.11 + } }, { - "id": "grok-code-fast-1", - "name": "Grok Code Fast 1", - "display_name": "Grok Code Fast 1", + "id": "zai-org/glm-4.5", + "name": "GLM-4.5", + "display_name": "GLM-4.5", "modalities": { "input": [ "text" @@ -26884,8 +26515,8 @@ ] }, "limit": { - "context": 256000, - "output": 10000 + "context": 131072, + "output": 98304 }, "temperature": true, "tool_call": true, @@ -26894,59 +26525,52 @@ "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2023-10", - "release_date": "2025-08-28", - "last_updated": "2025-08-28", + "open_weights": true, + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 0.2, - "output": 1.5, - "cache_read": 0.02 - }, - "type": "chat" + "input": 0.6, + "output": 2.2, + "cache_read": 0.11 + } }, { - "id": "gpt-5.1-codex", - "name": "GPT-5.1 Codex", - "display_name": "GPT-5.1 Codex", + "id": "zai-org/glm-4.7-flash", + "name": "GLM-4.7-Flash", + "display_name": "GLM-4.7-Flash", "modalities": { "input": [ - "text", - "image", - "audio" + "text" ], "output": [ - "text", - "image", - "audio" + "text" ] }, "limit": { - "context": 400000, + "context": 200000, "output": 128000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-14", - "last_updated": "2025-11-14", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2026-01-19", + "last_updated": "2026-01-19", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 - }, - "type": "chat" + "input": 0.07, + "output": 0.4, + "cache_read": 0.01 + } }, { - "id": "phi-3-mini-4k-instruct", - "name": "Phi-3-mini-instruct (4k)", - "display_name": "Phi-3-mini-instruct (4k)", + "id": "zai-org/glm-4.5-air", + "name": "GLM 4.5 Air", + "display_name": "GLM 4.5 Air", "modalities": { "input": [ "text" @@ -26956,42 +26580,42 @@ ] }, "limit": { - "context": 4096, - "output": 1024 + "context": 131072, + "output": 98304 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-04-23", - "last_updated": "2024-04-23", + "knowledge": "2025-04", + "release_date": "2025-10-13", + "last_updated": "2025-10-13", "cost": { "input": 0.13, - "output": 0.52 - }, - "type": "chat" + "output": 0.85 + } }, { - "id": "claude-haiku-4-5", - "name": "Claude Haiku 4.5", - "display_name": "Claude Haiku 4.5", + "id": "zai-org/glm-4.5v", + "name": "GLM 4.5V", + "display_name": "GLM 4.5V", "modalities": { "input": [ "text", - "image", - "pdf" + "video", + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 65536, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -27000,22 +26624,20 @@ "default": true }, "attachment": true, - "open_weights": false, - "knowledge": "2025-02-31", - "release_date": "2025-11-18", - "last_updated": "2025-11-18", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-08-11", + "last_updated": "2025-08-11", "cost": { - "input": 1, - "output": 5, - "cache_read": 0.1, - "cache_write": 1.25 - }, - "type": "chat" + "input": 0.6, + "output": 1.8, + "cache_read": 0.11 + } }, { - "id": "deepseek-v3.2-speciale", - "name": "DeepSeek-V3.2-Speciale", - "display_name": "DeepSeek-V3.2-Speciale", + "id": "zai-org/glm-4.6", + "name": "GLM 4.6", + "display_name": "GLM 4.6", "modalities": { "input": [ "text" @@ -27025,33 +26647,33 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 204800, + "output": 131072 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, "attachment": false, "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-12-01", - "last_updated": "2025-12-01", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", "cost": { - "input": 0.28, - "output": 0.42 - }, - "type": "chat" + "input": 0.55, + "output": 2.2, + "cache_read": 0.11 + } }, { - "id": "mistral-medium-2505", - "name": "Mistral Medium 3", - "display_name": "Mistral Medium 3", + "id": "zai-org/glm-4.6v", + "name": "GLM 4.6V", + "display_name": "GLM 4.6V", "modalities": { "input": [ "text", + "video", "image" ], "output": [ @@ -27059,101 +26681,73 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, - "open_weights": false, - "knowledge": "2025-05", - "release_date": "2025-05-07", - "last_updated": "2025-05-07", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-12-08", + "last_updated": "2025-12-08", "cost": { - "input": 0.4, - "output": 2 - }, - "type": "chat" + "input": 0.3, + "output": 0.9, + "cache_read": 0.055 + } }, { - "id": "claude-opus-4-5", - "name": "Claude Opus 4.5", - "display_name": "Claude Opus 4.5", + "id": "zai-org/autoglm-phone-9b-multilingual", + "name": "AutoGLM-Phone-9B-Multilingual", + "display_name": "AutoGLM-Phone-9B-Multilingual", "modalities": { "input": [ "text", - "image", - "pdf" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 200000, - "output": 64000 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-11-24", - "last_updated": "2025-08-01", - "cost": { - "input": 5, - "output": 25, - "cache_read": 1.5, - "cache_write": 18.75 - }, - "type": "chat" - }, - { - "id": "phi-3-small-128k-instruct", - "name": "Phi-3-small-instruct (128k)", - "display_name": "Phi-3-small-instruct (128k)", - "modalities": { - "input": [ - "text" + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 65536, + "output": 65536 }, "temperature": true, "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-04-23", - "last_updated": "2024-04-23", + "release_date": "2025-12-10", + "last_updated": "2025-12-10", "cost": { - "input": 0.15, - "output": 0.6 - }, - "type": "chat" - }, + "input": 0.035, + "output": 0.138 + } + } + ] + }, + "venice": { + "id": "venice", + "name": "Venice AI", + "display_name": "Venice AI", + "doc": "https://docs.venice.ai", + "models": [ { - "id": "cohere-command-a", - "name": "Command A", - "display_name": "Command A", + "id": "grok-41-fast", + "name": "Grok 4.1 Fast", + "display_name": "Grok 4.1 Fast", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -27161,7 +26755,7 @@ }, "limit": { "context": 256000, - "output": 8000 + "output": 64000 }, "temperature": true, "tool_call": true, @@ -27169,21 +26763,21 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-06-01", - "release_date": "2025-03-13", - "last_updated": "2025-03-13", + "attachment": true, + "open_weights": false, + "knowledge": "2025-07", + "release_date": "2025-12-01", + "last_updated": "2026-01-28", "cost": { - "input": 2.5, - "output": 10 - }, - "type": "chat" + "input": 0.5, + "output": 1.25, + "cache_read": 0.125 + } }, { - "id": "cohere-command-r-plus-08-2024", - "name": "Command R+", - "display_name": "Command R+", + "id": "qwen3-235b-a22b-instruct-2507", + "name": "Qwen 3 235B A22B Instruct 2507", + "display_name": "Qwen 3 235B A22B Instruct 2507", "modalities": { "input": [ "text" @@ -27194,96 +26788,100 @@ }, "limit": { "context": 128000, - "output": 4000 + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2024-06-01", - "release_date": "2024-08-30", - "last_updated": "2024-08-30", + "knowledge": "2025-07", + "release_date": "2025-04-29", + "last_updated": "2026-01-28", "cost": { - "input": 2.5, - "output": 10 - }, - "type": "chat" + "input": 0.15, + "output": 0.75 + } }, { - "id": "llama-4-maverick-17b-128e-instruct-fp8", - "name": "Llama 4 Maverick 17B 128E Instruct FP8", - "display_name": "Llama 4 Maverick 17B 128E Instruct FP8", + "id": "gemini-3-flash-preview", + "name": "Gemini 3 Flash Preview", + "display_name": "Gemini 3 Flash Preview", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 256000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, - "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-12-19", + "last_updated": "2026-01-28", "cost": { - "input": 0.25, - "output": 1 - }, - "type": "chat" + "input": 0.7, + "output": 3.75, + "cache_read": 0.07 + } }, { - "id": "gpt-4.1-mini", - "name": "GPT-4.1 mini", - "display_name": "GPT-4.1 mini", + "id": "claude-opus-45", + "name": "Claude Opus 4.5", + "display_name": "Claude Opus 4.5", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 198000, + "output": 49500 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2024-05", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "knowledge": "2025-03", + "release_date": "2025-12-06", + "last_updated": "2026-01-28", "cost": { - "input": 0.4, - "output": 1.6, - "cache_read": 0.1 - }, - "type": "chat" + "input": 6, + "output": 30, + "cache_read": 0.6, + "cache_write": 7.5 + } }, { - "id": "gpt-5-chat", - "name": "GPT-5 Chat", - "display_name": "GPT-5 Chat", + "id": "mistral-31-24b", + "name": "Venice Medium", + "display_name": "Venice Medium", "modalities": { "input": [ "text", @@ -27295,30 +26893,27 @@ }, "limit": { "context": 128000, - "output": 16384 + "output": 32000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2024-10-24", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2025-03-18", + "last_updated": "2026-01-28", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.13 - }, - "type": "chat" + "input": 0.5, + "output": 2 + } }, { - "id": "deepseek-v3.1", - "name": "DeepSeek-V3.1", - "display_name": "DeepSeek-V3.1", + "id": "grok-code-fast-1", + "name": "Grok Code Fast 1", + "display_name": "Grok Code Fast 1", "modalities": { "input": [ "text" @@ -27328,8 +26923,8 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 256000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -27338,20 +26933,19 @@ "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-08-21", - "last_updated": "2025-08-21", + "open_weights": false, + "release_date": "2025-12-01", + "last_updated": "2026-01-28", "cost": { - "input": 0.56, - "output": 1.68 - }, - "type": "chat" + "input": 0.25, + "output": 1.87, + "cache_read": 0.03 + } }, { - "id": "phi-4", - "name": "Phi-4", - "display_name": "Phi-4", + "id": "zai-org-glm-4.7", + "name": "GLM 4.7", + "display_name": "GLM 4.7", "modalities": { "input": [ "text" @@ -27361,75 +26955,73 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 198000, + "output": 49500 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "knowledge": "2025-04", + "release_date": "2025-12-24", + "last_updated": "2026-01-28", "cost": { - "input": 0.125, - "output": 0.5 - }, - "type": "chat" + "input": 0.55, + "output": 2.65, + "cache_read": 0.11 + } }, { - "id": "phi-4-mini-reasoning", - "name": "Phi-4-mini-reasoning", - "display_name": "Phi-4-mini-reasoning", + "id": "qwen3-vl-235b-a22b", + "name": "Qwen3 VL 235B", + "display_name": "Qwen3 VL 235B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 256000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "release_date": "2026-01-16", + "last_updated": "2026-01-28", "cost": { - "input": 0.075, - "output": 0.3 - }, - "type": "chat" + "input": 0.25, + "output": 1.5 + } }, { - "id": "claude-sonnet-4-5", - "name": "Claude Sonnet 4.5", - "display_name": "Claude Sonnet 4.5", + "id": "claude-opus-4-6", + "name": "Claude Opus 4.6", + "display_name": "Claude Opus 4.6", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 1000000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -27439,21 +27031,19 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-11-18", - "last_updated": "2025-11-18", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 - }, - "type": "chat" + "input": 6, + "output": 30, + "cache_read": 0.6, + "cache_write": 7.5 + } }, { - "id": "gpt-3.5-turbo-0125", - "name": "GPT-3.5 Turbo 0125", - "display_name": "GPT-3.5 Turbo 0125", + "id": "venice-uncensored", + "name": "Venice Uncensored 1.1", + "display_name": "Venice Uncensored 1.1", "modalities": { "input": [ "text" @@ -27463,8 +27053,8 @@ ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 32000, + "output": 8000 }, "temperature": true, "tool_call": false, @@ -27472,53 +27062,55 @@ "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2021-08", - "release_date": "2024-01-25", - "last_updated": "2024-01-25", + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2025-03-18", + "last_updated": "2026-01-28", "cost": { - "input": 0.5, - "output": 1.5 - }, - "type": "chat" + "input": 0.2, + "output": 0.9 + } }, { - "id": "grok-3", - "name": "Grok 3", - "display_name": "Grok 3", + "id": "gemini-3-pro-preview", + "name": "Gemini 3 Pro Preview", + "display_name": "Gemini 3 Pro Preview", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 198000, + "output": 49500 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-11", - "release_date": "2025-02-17", - "last_updated": "2025-02-17", + "knowledge": "2024-04", + "release_date": "2025-12-02", + "last_updated": "2026-01-28", "cost": { - "input": 3, + "input": 2.5, "output": 15, - "cache_read": 0.75 - }, - "type": "chat" + "cache_read": 0.625 + } }, { - "id": "text-embedding-3-large", - "name": "text-embedding-3-large", - "display_name": "text-embedding-3-large", + "id": "openai-gpt-52", + "name": "GPT-5.2", + "display_name": "GPT-5.2", "modalities": { "input": [ "text" @@ -27528,27 +27120,30 @@ ] }, "limit": { - "context": 8191, - "output": 3072 + "context": 256000, + "output": 64000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "release_date": "2024-01-25", - "last_updated": "2024-01-25", + "knowledge": "2025-08-31", + "release_date": "2025-12-13", + "last_updated": "2026-01-28", "cost": { - "input": 0.13, - "output": 0 - }, - "type": "embedding" + "input": 2.19, + "output": 17.5, + "cache_read": 0.219 + } }, { - "id": "meta-llama-3-70b-instruct", - "name": "Meta-Llama-3-70B-Instruct", - "display_name": "Meta-Llama-3-70B-Instruct", + "id": "qwen3-4b", + "name": "Venice Small", + "display_name": "Venice Small", "modalities": { "input": [ "text" @@ -27558,29 +27153,29 @@ ] }, "limit": { - "context": 8192, - "output": 2048 + "context": 32000, + "output": 8000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-04-18", - "last_updated": "2024-04-18", + "knowledge": "2024-07", + "release_date": "2025-04-29", + "last_updated": "2026-01-28", "cost": { - "input": 2.68, - "output": 3.54 - }, - "type": "chat" + "input": 0.05, + "output": 0.15 + } }, { - "id": "deepseek-v3-0324", - "name": "DeepSeek-V3-0324", - "display_name": "DeepSeek-V3-0324", + "id": "llama-3.3-70b", + "name": "Llama 3.3 70B", + "display_name": "Llama 3.3 70B", "modalities": { "input": [ "text" @@ -27590,8 +27185,8 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 128000, + "output": 32000 }, "temperature": true, "tool_call": true, @@ -27600,51 +27195,53 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-03-24", - "last_updated": "2025-03-24", + "knowledge": "2023-12", + "release_date": "2025-04-06", + "last_updated": "2026-01-28", "cost": { - "input": 1.14, - "output": 4.56 - }, - "type": "chat" + "input": 0.7, + "output": 2.8 + } }, { - "id": "phi-3-small-8k-instruct", - "name": "Phi-3-small-instruct (8k)", - "display_name": "Phi-3-small-instruct (8k)", + "id": "claude-sonnet-45", + "name": "Claude Sonnet 4.5", + "display_name": "Claude Sonnet 4.5", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 2048 + "context": 198000, + "output": 49500 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-04-23", - "last_updated": "2024-04-23", + "attachment": true, + "open_weights": false, + "knowledge": "2025-09", + "release_date": "2025-01-15", + "last_updated": "2026-01-28", "cost": { - "input": 0.15, - "output": 0.6 - }, - "type": "chat" + "input": 3.75, + "output": 18.75, + "cache_read": 0.375, + "cache_write": 4.69 + } }, { - "id": "meta-llama-3.1-70b-instruct", - "name": "Meta-Llama-3.1-70B-Instruct", - "display_name": "Meta-Llama-3.1-70B-Instruct", + "id": "openai-gpt-oss-120b", + "name": "OpenAI GPT OSS 120B", + "display_name": "OpenAI GPT OSS 120B", "modalities": { "input": [ "text" @@ -27655,7 +27252,7 @@ }, "limit": { "context": 128000, - "output": 32768 + "output": 32000 }, "temperature": true, "tool_call": true, @@ -27664,52 +27261,51 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "knowledge": "2025-07", + "release_date": "2025-11-06", + "last_updated": "2026-01-28", "cost": { - "input": 2.68, - "output": 3.54 - }, - "type": "chat" + "input": 0.07, + "output": 0.3 + } }, { - "id": "gpt-4-turbo", - "name": "GPT-4 Turbo", - "display_name": "GPT-4 Turbo", - "modalities": { + "id": "kimi-k2-thinking", + "name": "Kimi K2 Thinking", + "display_name": "Kimi K2 Thinking", + "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 256000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2023-11", - "release_date": "2023-11-06", - "last_updated": "2024-04-09", + "attachment": false, + "open_weights": true, + "knowledge": "2024-04", + "release_date": "2025-12-10", + "last_updated": "2026-01-28", "cost": { - "input": 10, - "output": 30 - }, - "type": "chat" + "input": 0.75, + "output": 3.2, + "cache_read": 0.375 + } }, { - "id": "gpt-3.5-turbo-0613", - "name": "GPT-3.5 Turbo 0613", - "display_name": "GPT-3.5 Turbo 0613", + "id": "qwen3-235b-a22b-thinking-2507", + "name": "Qwen 3 235B A22B Thinking 2507", + "display_name": "Qwen 3 235B A22B Thinking 2507", "modalities": { "input": [ "text" @@ -27719,29 +27315,29 @@ ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 128000, + "output": 32000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2021-08", - "release_date": "2023-06-13", - "last_updated": "2023-06-13", + "open_weights": true, + "knowledge": "2025-07", + "release_date": "2025-04-29", + "last_updated": "2026-01-28", "cost": { - "input": 3, - "output": 4 - }, - "type": "chat" + "input": 0.45, + "output": 3.5 + } }, { - "id": "phi-3.5-mini-instruct", - "name": "Phi-3.5-mini-instruct", - "display_name": "Phi-3.5-mini-instruct", + "id": "zai-org-glm-4.7-flash", + "name": "GLM 4.7 Flash", + "display_name": "GLM 4.7 Flash", "modalities": { "input": [ "text" @@ -27752,28 +27348,26 @@ }, "limit": { "context": 128000, - "output": 4096 + "output": 32000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-08-20", - "last_updated": "2024-08-20", + "release_date": "2026-01-29", + "last_updated": "2026-01-30", "cost": { - "input": 0.13, - "output": 0.52 - }, - "type": "chat" + "input": 0.125, + "output": 0.5 + } }, { - "id": "o1-preview", - "name": "o1-preview", - "display_name": "o1-preview", + "id": "llama-3.2-3b", + "name": "Llama 3.2 3B", + "display_name": "Llama 3.2 3B", "modalities": { "input": [ "text" @@ -27784,62 +27378,59 @@ }, "limit": { "context": 128000, - "output": 32768 + "output": 32000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-09-12", - "last_updated": "2024-09-12", + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-10-03", + "last_updated": "2026-01-28", "cost": { - "input": 16.5, - "output": 66, - "cache_read": 8.25 - }, - "type": "chat" + "input": 0.15, + "output": 0.6 + } }, { - "id": "llama-3.3-70b-instruct", - "name": "Llama-3.3-70B-Instruct", - "display_name": "Llama-3.3-70B-Instruct", + "id": "google-gemma-3-27b-it", + "name": "Google Gemma 3 27B Instruct", + "display_name": "Google Gemma 3 27B Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 198000, + "output": 49500 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "knowledge": "2025-07", + "release_date": "2025-11-04", + "last_updated": "2026-01-28", "cost": { - "input": 0.71, - "output": 0.71 - }, - "type": "chat" + "input": 0.12, + "output": 0.2 + } }, { - "id": "gpt-5.1-codex-mini", - "name": "GPT-5.1 Codex Mini", - "display_name": "GPT-5.1 Codex Mini", + "id": "kimi-k2-5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ "text", @@ -27850,31 +27441,61 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 256000, + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-14", - "last_updated": "2025-11-14", + "attachment": true, + "open_weights": true, + "knowledge": "2024-04", + "release_date": "2026-01-27", + "last_updated": "2026-01-28", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.025 + "input": 0.75, + "output": 3.75, + "cache_read": 0.125 + } + }, + { + "id": "hermes-3-llama-3.1-405b", + "name": "Hermes 3 Llama 3.1 405b", + "display_name": "Hermes 3 Llama 3.1 405b", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] }, - "type": "chat" + "limit": { + "context": 128000, + "output": 32000 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "knowledge": "2024-04", + "release_date": "2025-09-25", + "last_updated": "2026-01-28", + "cost": { + "input": 1.1, + "output": 3 + } }, { - "id": "kimi-k2-thinking", - "name": "Kimi K2 Thinking", - "display_name": "Kimi K2 Thinking", + "id": "minimax-m21", + "name": "MiniMax M2.1", + "display_name": "MiniMax M2.1", "modalities": { "input": [ "text" @@ -27884,8 +27505,8 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 198000, + "output": 49500 }, "temperature": true, "tool_call": true, @@ -27895,51 +27516,49 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-11-06", - "last_updated": "2025-12-02", + "release_date": "2025-12-01", + "last_updated": "2026-01-28", "cost": { - "input": 0.6, - "output": 2.5, - "cache_read": 0.15 - }, - "type": "chat" + "input": 0.4, + "output": 1.6, + "cache_read": 0.04 + } }, { - "id": "model-router", - "name": "Model Router", - "display_name": "Model Router", + "id": "qwen3-next-80b", + "name": "Qwen 3 Next 80b", + "display_name": "Qwen 3 Next 80b", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 256000, + "output": 64000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-05-19", - "last_updated": "2025-11-18", + "attachment": false, + "open_weights": true, + "knowledge": "2025-07", + "release_date": "2025-04-29", + "last_updated": "2026-01-28", "cost": { - "input": 0.14, - "output": 0 - }, - "type": "chat" + "input": 0.35, + "output": 1.9 + } }, { - "id": "o3-mini", - "name": "o3-mini", - "display_name": "o3-mini", + "id": "qwen3-coder-480b-a35b-instruct", + "name": "Qwen 3 Coder 480b", + "display_name": "Qwen 3 Coder 480b", "modalities": { "input": [ "text" @@ -27949,48 +27568,42 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 256000, + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-05", - "release_date": "2024-12-20", - "last_updated": "2025-01-29", + "open_weights": true, + "knowledge": "2025-07", + "release_date": "2025-04-29", + "last_updated": "2026-01-28", "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.55 - }, - "type": "chat" + "input": 0.75, + "output": 3 + } }, { - "id": "gpt-5.1", - "name": "GPT-5.1", - "display_name": "GPT-5.1", + "id": "openai-gpt-52-codex", + "name": "GPT-5.2 Codex", + "display_name": "GPT-5.2 Codex", "modalities": { "input": [ "text", - "image", - "audio" + "image" ], "output": [ - "text", - "image", - "audio" + "text" ] }, "limit": { - "context": 272000, - "output": 128000 + "context": 256000, + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -27998,69 +27611,74 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-14", - "last_updated": "2025-11-14", + "knowledge": "2025-08", + "release_date": "2025-01-15", + "last_updated": "2026-01-28", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 - }, - "type": "chat" + "input": 2.19, + "output": 17.5, + "cache_read": 0.219 + } }, { - "id": "gpt-5-nano", - "name": "GPT-5 Nano", - "display_name": "GPT-5 Nano", + "id": "deepseek-v3.2", + "name": "DeepSeek V3.2", + "display_name": "DeepSeek V3.2", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 272000, - "output": 128000 + "context": 160000, + "output": 40000 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "attachment": false, + "open_weights": true, + "knowledge": "2025-10", + "release_date": "2025-12-04", + "last_updated": "2026-01-28", "cost": { - "input": 0.05, - "output": 0.4, - "cache_read": 0.01 - }, - "type": "chat" - }, + "input": 0.4, + "output": 1, + "cache_read": 0.2 + } + } + ] + }, + "siliconflow": { + "id": "siliconflow", + "name": "SiliconFlow", + "display_name": "SiliconFlow", + "api": "https://api.siliconflow.cn/v1", + "doc": "https://cloud.siliconflow.com/models", + "models": [ { - "id": "gpt-5-codex", - "name": "GPT-5-Codex", - "display_name": "GPT-5-Codex", + "id": "inclusionAI/Ring-flash-2.0", + "name": "inclusionAI/Ring-flash-2.0", + "display_name": "inclusionAI/Ring-flash-2.0", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 131072, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -28068,31 +27686,28 @@ }, "attachment": false, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-09-15", - "last_updated": "2025-09-15", + "release_date": "2025-09-29", + "last_updated": "2025-11-25", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.13 + "input": 0.14, + "output": 0.57 }, "type": "chat" }, { - "id": "llama-3.2-90b-vision-instruct", - "name": "Llama-3.2-90B-Vision-Instruct", - "display_name": "Llama-3.2-90B-Vision-Instruct", + "id": "inclusionAI/Ling-flash-2.0", + "name": "inclusionAI/Ling-flash-2.0", + "display_name": "inclusionAI/Ling-flash-2.0", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 131072, "output": 8192 }, "temperature": true, @@ -28100,21 +27715,20 @@ "reasoning": { "supported": false }, - "attachment": true, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-09-25", - "last_updated": "2024-09-25", + "attachment": false, + "open_weights": false, + "release_date": "2025-09-18", + "last_updated": "2025-11-25", "cost": { - "input": 2.04, - "output": 2.04 + "input": 0.14, + "output": 0.57 }, "type": "chat" }, { - "id": "phi-3-mini-128k-instruct", - "name": "Phi-3-mini-instruct (128k)", - "display_name": "Phi-3-mini-instruct (128k)", + "id": "inclusionAI/Ling-mini-2.0", + "name": "inclusionAI/Ling-mini-2.0", + "display_name": "inclusionAI/Ling-mini-2.0", "modalities": { "input": [ "text" @@ -28124,33 +27738,31 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 131072, + "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-04-23", - "last_updated": "2024-04-23", + "open_weights": false, + "release_date": "2025-09-10", + "last_updated": "2025-11-25", "cost": { - "input": 0.13, - "output": 0.52 + "input": 0.07, + "output": 0.28 }, "type": "chat" }, { - "id": "gpt-4o", - "name": "GPT-4o", - "display_name": "GPT-4o", + "id": "Kwaipilot/KAT-Dev", + "name": "Kwaipilot/KAT-Dev", + "display_name": "Kwaipilot/KAT-Dev", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -28158,29 +27770,26 @@ }, "limit": { "context": 128000, - "output": 16384 + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-05-13", - "last_updated": "2024-05-13", + "release_date": "2025-09-27", + "last_updated": "2026-01-16", "cost": { - "input": 2.5, - "output": 10, - "cache_read": 1.25 - }, - "type": "chat" + "input": 0.2, + "output": 0.6 + } }, { - "id": "gpt-3.5-turbo-0301", - "name": "GPT-3.5 Turbo 0301", - "display_name": "GPT-3.5 Turbo 0301", + "id": "moonshotai/Kimi-K2-Thinking", + "name": "moonshotai/Kimi-K2-Thinking", + "display_name": "moonshotai/Kimi-K2-Thinking", "modalities": { "input": [ "text" @@ -28190,29 +27799,28 @@ ] }, "limit": { - "context": 4096, - "output": 4096 + "context": 262000, + "output": 262000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "knowledge": "2021-08", - "release_date": "2023-03-01", - "last_updated": "2023-03-01", + "release_date": "2025-11-07", + "last_updated": "2025-11-25", "cost": { - "input": 1.5, - "output": 2 - }, - "type": "chat" + "input": 0.55, + "output": 2.5 + } }, { - "id": "ministral-3b", - "name": "Ministral 3B", - "display_name": "Ministral 3B", + "id": "moonshotai/Kimi-K2-Instruct-0905", + "name": "moonshotai/Kimi-K2-Instruct-0905", + "display_name": "moonshotai/Kimi-K2-Instruct-0905", "modalities": { "input": [ "text" @@ -28222,7 +27830,7 @@ ] }, "limit": { - "context": 128000, + "context": 131072, "output": 8192 }, "temperature": true, @@ -28231,124 +27839,112 @@ "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-03", - "release_date": "2024-10-22", - "last_updated": "2024-10-22", + "open_weights": false, + "release_date": "2025-09-08", + "last_updated": "2025-11-25", "cost": { - "input": 0.04, - "output": 0.04 + "input": 0.4, + "output": 2 }, "type": "chat" }, { - "id": "gpt-4.1", - "name": "GPT-4.1", - "display_name": "GPT-4.1", + "id": "moonshotai/Kimi-Dev-72B", + "name": "moonshotai/Kimi-Dev-72B", + "display_name": "moonshotai/Kimi-Dev-72B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-05", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "release_date": "2025-06-19", + "last_updated": "2025-11-25", "cost": { - "input": 2, - "output": 8, - "cache_read": 0.5 + "input": 0.29, + "output": 1.15 }, "type": "chat" }, { - "id": "o4-mini", - "name": "o4-mini", - "display_name": "o4-mini", + "id": "tencent/Hunyuan-A13B-Instruct", + "name": "tencent/Hunyuan-A13B-Instruct", + "display_name": "tencent/Hunyuan-A13B-Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 131072, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-05", - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "release_date": "2025-06-30", + "last_updated": "2025-11-25", "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.28 + "input": 0.14, + "output": 0.57 }, "type": "chat" }, { - "id": "phi-4-multimodal", - "name": "Phi-4-multimodal", - "display_name": "Phi-4-multimodal", + "id": "tencent/Hunyuan-MT-7B", + "name": "tencent/Hunyuan-MT-7B", + "display_name": "tencent/Hunyuan-MT-7B", "modalities": { "input": [ - "text", - "image", - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 131072, + "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "attachment": false, + "open_weights": false, + "release_date": "2025-09-18", + "last_updated": "2025-11-25", "cost": { - "input": 0.08, - "output": 0.32, - "input_audio": 4 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "meta-llama-3-8b-instruct", - "name": "Meta-Llama-3-8B-Instruct", - "display_name": "Meta-Llama-3-8B-Instruct", + "id": "MiniMaxAI/MiniMax-M1-80k", + "name": "MiniMaxAI/MiniMax-M1-80k", + "display_name": "MiniMaxAI/MiniMax-M1-80k", "modalities": { "input": [ "text" @@ -28358,64 +27954,58 @@ ] }, "limit": { - "context": 8192, - "output": 2048 + "context": 131072, + "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-04-18", - "last_updated": "2024-04-18", + "open_weights": false, + "release_date": "2025-06-17", + "last_updated": "2025-11-25", "cost": { - "input": 0.3, - "output": 0.61 + "input": 0.55, + "output": 2.2 }, "type": "chat" }, { - "id": "o1", - "name": "o1", - "display_name": "o1", + "id": "MiniMaxAI/MiniMax-M2", + "name": "MiniMaxAI/MiniMax-M2", + "display_name": "MiniMaxAI/MiniMax-M2", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 197000, + "output": 131000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-12-05", - "last_updated": "2024-12-05", + "release_date": "2025-10-28", + "last_updated": "2025-11-25", "cost": { - "input": 15, - "output": 60, - "cache_read": 7.5 - }, - "type": "chat" + "input": 0.3, + "output": 1.2 + } }, { - "id": "grok-3-mini", - "name": "Grok 3 Mini", - "display_name": "Grok 3 Mini", + "id": "THUDM/GLM-Z1-32B-0414", + "name": "THUDM/GLM-Z1-32B-0414", + "display_name": "THUDM/GLM-Z1-32B-0414", "modalities": { "input": [ "text" @@ -28431,64 +28021,53 @@ "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2024-11", - "release_date": "2025-02-17", - "last_updated": "2025-02-17", + "release_date": "2025-04-18", + "last_updated": "2025-11-25", "cost": { - "input": 0.3, - "output": 0.5, - "reasoning": 0.5, - "cache_read": 0.075 + "input": 0.14, + "output": 0.57 }, "type": "chat" }, { - "id": "gpt-5.1-chat", - "name": "GPT-5.1 Chat", - "display_name": "GPT-5.1 Chat", + "id": "THUDM/GLM-4-9B-0414", + "name": "THUDM/GLM-4-9B-0414", + "display_name": "THUDM/GLM-4-9B-0414", "modalities": { "input": [ - "text", - "image", - "audio" + "text" ], "output": [ - "text", - "image", - "audio" + "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 131072, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-14", - "last_updated": "2025-11-14", + "release_date": "2025-04-18", + "last_updated": "2025-11-25", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 0.086, + "output": 0.086 }, "type": "chat" }, { - "id": "phi-3.5-moe-instruct", - "name": "Phi-3.5-MoE-instruct", - "display_name": "Phi-3.5-MoE-instruct", + "id": "THUDM/GLM-Z1-9B-0414", + "name": "THUDM/GLM-Z1-9B-0414", + "display_name": "THUDM/GLM-Z1-9B-0414", "modalities": { "input": [ "text" @@ -28498,43 +28077,41 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 131072, + "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-08-20", - "last_updated": "2024-08-20", + "open_weights": false, + "release_date": "2025-04-18", + "last_updated": "2025-11-25", "cost": { - "input": 0.16, - "output": 0.64 + "input": 0.086, + "output": 0.086 }, "type": "chat" }, { - "id": "gpt-5-mini", - "name": "GPT-5 Mini", - "display_name": "GPT-5 Mini", + "id": "THUDM/GLM-4.1V-9B-Thinking", + "name": "THUDM/GLM-4.1V-9B-Thinking", + "display_name": "THUDM/GLM-4.1V-9B-Thinking", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 272000, - "output": 128000 + "context": 131072, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -28542,20 +28119,18 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "release_date": "2025-07-04", + "last_updated": "2025-11-25", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.03 + "input": 0.035, + "output": 0.14 }, "type": "chat" }, { - "id": "o1-mini", - "name": "o1-mini", - "display_name": "o1-mini", + "id": "THUDM/GLM-4-32B-0414", + "name": "THUDM/GLM-4-32B-0414", + "display_name": "THUDM/GLM-4-32B-0414", "modalities": { "input": [ "text" @@ -28565,42 +28140,38 @@ ] }, "limit": { - "context": 128000, - "output": 65536 + "context": 131072, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-09-12", - "last_updated": "2024-09-12", + "release_date": "2025-04-18", + "last_updated": "2025-11-25", "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.55 + "input": 0.27, + "output": 0.27 }, "type": "chat" }, { - "id": "llama-4-scout-17b-16e-instruct", - "name": "Llama 4 Scout 17B 16E Instruct", - "display_name": "Llama 4 Scout 17B 16E Instruct", + "id": "ascend-tribe/pangu-pro-moe", + "name": "ascend-tribe/pangu-pro-moe", + "display_name": "ascend-tribe/pangu-pro-moe", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 131072, "output": 8192 }, "temperature": true, @@ -28608,21 +28179,20 @@ "reasoning": { "supported": false }, - "attachment": true, - "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "attachment": false, + "open_weights": false, + "release_date": "2025-07-02", + "last_updated": "2026-01-16", "cost": { "input": 0.2, - "output": 0.78 + "output": 0.6 }, "type": "chat" }, { - "id": "cohere-embed-v3-english", - "name": "Embed v3 English", - "display_name": "Embed v3 English", + "id": "stepfun-ai/step3", + "name": "stepfun-ai/step3", + "display_name": "stepfun-ai/step3", "modalities": { "input": [ "text" @@ -28632,28 +28202,28 @@ ] }, "limit": { - "context": 512, - "output": 1024 + "context": 131072, + "output": 8192 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2023-11-07", - "last_updated": "2023-11-07", + "attachment": true, + "open_weights": false, + "release_date": "2025-08-06", + "last_updated": "2025-11-25", "cost": { - "input": 0.1, - "output": 0 + "input": 0.57, + "output": 1.42 }, "type": "chat" }, { - "id": "text-embedding-ada-002", - "name": "text-embedding-ada-002", - "display_name": "text-embedding-ada-002", + "id": "baidu/ERNIE-4.5-300B-A47B", + "name": "baidu/ERNIE-4.5-300B-A47B", + "display_name": "baidu/ERNIE-4.5-300B-A47B", "modalities": { "input": [ "text" @@ -28663,27 +28233,28 @@ ] }, "limit": { - "context": 8192, - "output": 1536 + "context": 131072, + "output": 8192 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2022-12-15", - "last_updated": "2022-12-15", + "release_date": "2025-07-02", + "last_updated": "2025-11-25", "cost": { - "input": 0.1, - "output": 0 + "input": 0.28, + "output": 1.1 }, - "type": "embedding" + "type": "chat" }, { - "id": "meta-llama-3.1-8b-instruct", - "name": "Meta-Llama-3.1-8B-Instruct", - "display_name": "Meta-Llama-3.1-8B-Instruct", + "id": "ByteDance-Seed/Seed-OSS-36B-Instruct", + "name": "ByteDance-Seed/Seed-OSS-36B-Instruct", + "display_name": "ByteDance-Seed/Seed-OSS-36B-Instruct", "modalities": { "input": [ "text" @@ -28693,8 +28264,8 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -28702,55 +28273,51 @@ "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "open_weights": false, + "release_date": "2025-09-04", + "last_updated": "2025-11-25", "cost": { - "input": 0.3, - "output": 0.61 + "input": 0.21, + "output": 0.57 }, "type": "chat" }, { - "id": "gpt-5.1-codex-max", - "name": "GPT-5.1 Codex Max", - "display_name": "GPT-5.1 Codex Max", + "id": "Qwen/Qwen3-Next-80B-A3B-Thinking", + "name": "Qwen/Qwen3-Next-80B-A3B-Thinking", + "display_name": "Qwen/Qwen3-Next-80B-A3B-Thinking", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 131072, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "release_date": "2025-09-25", + "last_updated": "2025-11-25", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 0.14, + "output": 0.57 }, "type": "chat" }, { - "id": "gpt-3.5-turbo-instruct", - "name": "GPT-3.5 Turbo Instruct", - "display_name": "GPT-3.5 Turbo Instruct", + "id": "Qwen/Qwen2.5-14B-Instruct", + "name": "Qwen/Qwen2.5-14B-Instruct", + "display_name": "Qwen/Qwen2.5-14B-Instruct", "modalities": { "input": [ "text" @@ -28760,29 +28327,28 @@ ] }, "limit": { - "context": 4096, - "output": 4096 + "context": 131072, + "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2021-08", - "release_date": "2023-09-21", - "last_updated": "2023-09-21", + "release_date": "2024-09-18", + "last_updated": "2025-11-25", "cost": { - "input": 1.5, - "output": 2 + "input": 0.1, + "output": 0.1 }, "type": "chat" }, { - "id": "mistral-nemo", - "name": "Mistral Nemo", - "display_name": "Mistral Nemo", + "id": "Qwen/Qwen3-Next-80B-A3B-Instruct", + "name": "Qwen/Qwen3-Next-80B-A3B-Instruct", + "display_name": "Qwen/Qwen3-Next-80B-A3B-Instruct", "modalities": { "input": [ "text" @@ -28792,8 +28358,8 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -28801,20 +28367,19 @@ "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-07", - "release_date": "2024-07-18", - "last_updated": "2024-07-18", + "open_weights": false, + "release_date": "2025-09-18", + "last_updated": "2025-11-25", "cost": { - "input": 0.15, - "output": 0.15 + "input": 0.14, + "output": 1.4 }, "type": "chat" }, { - "id": "o3", - "name": "o3", - "display_name": "o3", + "id": "Qwen/Qwen3-VL-32B-Instruct", + "name": "Qwen/Qwen3-VL-32B-Instruct", + "display_name": "Qwen/Qwen3-VL-32B-Instruct", "modalities": { "input": [ "text", @@ -28825,31 +28390,27 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 262000, + "output": 262000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2024-05", - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "release_date": "2025-10-21", + "last_updated": "2025-11-25", "cost": { - "input": 2, - "output": 8, - "cache_read": 0.5 - }, - "type": "chat" + "input": 0.2, + "output": 0.6 + } }, { - "id": "codex-mini", - "name": "Codex Mini", - "display_name": "Codex Mini", + "id": "Qwen/Qwen3-Omni-30B-A3B-Thinking", + "name": "Qwen/Qwen3-Omni-30B-A3B-Thinking", + "display_name": "Qwen/Qwen3-Omni-30B-A3B-Thinking", "modalities": { "input": [ "text" @@ -28859,10 +28420,10 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 131072, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -28870,20 +28431,18 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-05-16", - "last_updated": "2025-05-16", + "release_date": "2025-10-04", + "last_updated": "2025-11-25", "cost": { - "input": 1.5, - "output": 6, - "cache_read": 0.375 + "input": 0.1, + "output": 0.4 }, "type": "chat" }, { - "id": "phi-3-medium-4k-instruct", - "name": "Phi-3-medium-instruct (4k)", - "display_name": "Phi-3-medium-instruct (4k)", + "id": "Qwen/Qwen3-235B-A22B-Thinking-2507", + "name": "Qwen/Qwen3-235B-A22B-Thinking-2507", + "display_name": "Qwen/Qwen3-235B-A22B-Thinking-2507", "modalities": { "input": [ "text" @@ -28893,95 +28452,93 @@ ] }, "limit": { - "context": 4096, - "output": 1024 + "context": 131072, + "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-04-23", - "last_updated": "2024-04-23", + "open_weights": false, + "release_date": "2025-07-28", + "last_updated": "2025-11-25", "cost": { - "input": 0.17, - "output": 0.68 + "input": 0.13, + "output": 0.6 }, "type": "chat" }, { - "id": "phi-4-reasoning", - "name": "Phi-4-reasoning", - "display_name": "Phi-4-reasoning", + "id": "Qwen/Qwen3-VL-32B-Thinking", + "name": "Qwen/Qwen3-VL-32B-Thinking", + "display_name": "Qwen/Qwen3-VL-32B-Thinking", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32000, - "output": 4096 + "context": 262000, + "output": 262000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "attachment": true, + "open_weights": false, + "release_date": "2025-10-21", + "last_updated": "2025-11-25", "cost": { - "input": 0.125, - "output": 0.5 - }, - "type": "chat" + "input": 0.2, + "output": 1.5 + } }, { - "id": "gpt-4-turbo-vision", - "name": "GPT-4 Turbo Vision", - "display_name": "GPT-4 Turbo Vision", + "id": "Qwen/Qwen3-VL-30B-A3B-Thinking", + "name": "Qwen/Qwen3-VL-30B-A3B-Thinking", + "display_name": "Qwen/Qwen3-VL-30B-A3B-Thinking", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2023-11", - "release_date": "2023-11-06", - "last_updated": "2024-04-09", + "release_date": "2025-10-11", + "last_updated": "2025-11-25", "cost": { - "input": 10, - "output": 30 + "input": 0.29, + "output": 1 }, "type": "chat" }, { - "id": "phi-4-reasoning-plus", - "name": "Phi-4-reasoning-plus", - "display_name": "Phi-4-reasoning-plus", + "id": "Qwen/Qwen3-30B-A3B-Instruct-2507", + "name": "Qwen/Qwen3-30B-A3B-Instruct-2507", + "display_name": "Qwen/Qwen3-30B-A3B-Instruct-2507", "modalities": { "input": [ "text" @@ -28991,99 +28548,90 @@ ] }, "limit": { - "context": 32000, - "output": 4096 + "context": 131072, + "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "open_weights": false, + "release_date": "2025-07-30", + "last_updated": "2025-11-25", "cost": { - "input": 0.125, - "output": 0.5 + "input": 0.09, + "output": 0.3 }, "type": "chat" }, { - "id": "gpt-4o-mini", - "name": "GPT-4o mini", - "display_name": "GPT-4o mini", + "id": "Qwen/Qwen3-VL-235B-A22B-Thinking", + "name": "Qwen/Qwen3-VL-235B-A22B-Thinking", + "display_name": "Qwen/Qwen3-VL-235B-A22B-Thinking", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-07-18", - "last_updated": "2024-07-18", + "release_date": "2025-10-04", + "last_updated": "2025-11-25", "cost": { - "input": 0.15, - "output": 0.6, - "cache_read": 0.08 + "input": 0.45, + "output": 3.5 }, "type": "chat" }, { - "id": "gpt-5", - "name": "GPT-5", - "display_name": "GPT-5", + "id": "Qwen/Qwen3-Coder-480B-A35B-Instruct", + "name": "Qwen/Qwen3-Coder-480B-A35B-Instruct", + "display_name": "Qwen/Qwen3-Coder-480B-A35B-Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 272000, - "output": 128000 + "context": 131072, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "release_date": "2025-07-31", + "last_updated": "2025-11-25", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.13 - }, - "type": "chat" + "input": 0.25, + "output": 1 + } }, { - "id": "mai-ds-r1", - "name": "MAI-DS-R1", - "display_name": "MAI-DS-R1", + "id": "Qwen/Qwen3-VL-235B-A22B-Instruct", + "name": "Qwen/Qwen3-VL-235B-A22B-Instruct", + "display_name": "Qwen/Qwen3-VL-235B-A22B-Instruct", "modalities": { "input": [ "text" @@ -29093,98 +28641,90 @@ ] }, "limit": { - "context": 128000, + "context": 131072, "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-06", - "release_date": "2025-01-20", - "last_updated": "2025-01-20", + "release_date": "2025-10-04", + "last_updated": "2025-11-25", "cost": { - "input": 1.35, - "output": 5.4 + "input": 0.3, + "output": 1.5 }, "type": "chat" }, { - "id": "deepseek-v3.2", - "name": "DeepSeek-V3.2", - "display_name": "DeepSeek-V3.2", + "id": "Qwen/Qwen3-VL-8B-Instruct", + "name": "Qwen/Qwen3-VL-8B-Instruct", + "display_name": "Qwen/Qwen3-VL-8B-Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-12-01", - "last_updated": "2025-12-01", + "attachment": true, + "open_weights": false, + "release_date": "2025-10-15", + "last_updated": "2025-11-25", "cost": { - "input": 0.28, - "output": 0.42, - "cache_read": 0.028 - }, - "type": "chat" + "input": 0.18, + "output": 0.68 + } }, { - "id": "gpt-5-pro", - "name": "GPT-5 Pro", - "display_name": "GPT-5 Pro", + "id": "Qwen/Qwen3-32B", + "name": "Qwen/Qwen3-32B", + "display_name": "Qwen/Qwen3-32B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 272000 + "context": 131072, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-10-06", - "last_updated": "2025-10-06", + "release_date": "2025-04-30", + "last_updated": "2025-11-25", "cost": { - "input": 15, - "output": 120 + "input": 0.14, + "output": 0.57 }, "type": "chat" }, { - "id": "mistral-large-2411", - "name": "Mistral Large 24.11", - "display_name": "Mistral Large 24.11", + "id": "Qwen/QwQ-32B", + "name": "Qwen/QwQ-32B", + "display_name": "Qwen/QwQ-32B", "modalities": { "input": [ "text" @@ -29194,8 +28734,8 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -29204,54 +28744,49 @@ }, "attachment": false, "open_weights": false, - "knowledge": "2024-09", - "release_date": "2024-11-01", - "last_updated": "2024-11-01", + "release_date": "2025-03-06", + "last_updated": "2025-11-25", "cost": { - "input": 2, - "output": 6 + "input": 0.15, + "output": 0.58 }, "type": "chat" }, { - "id": "gpt-5.2", - "name": "GPT-5.2", - "display_name": "GPT-5.2", + "id": "Qwen/Qwen2.5-VL-72B-Instruct", + "name": "Qwen/Qwen2.5-VL-72B-Instruct", + "display_name": "Qwen/Qwen2.5-VL-72B-Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 131072, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "release_date": "2025-01-28", + "last_updated": "2025-11-25", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.125 + "input": 0.59, + "output": 0.59 }, "type": "chat" }, { - "id": "codestral-2501", - "name": "Codestral 25.01", - "display_name": "Codestral 25.01", + "id": "Qwen/Qwen2.5-7B-Instruct", + "name": "Qwen/Qwen2.5-7B-Instruct", + "display_name": "Qwen/Qwen2.5-7B-Instruct", "modalities": { "input": [ "text" @@ -29261,8 +28796,8 @@ ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -29271,52 +28806,48 @@ }, "attachment": false, "open_weights": false, - "knowledge": "2024-03", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "release_date": "2024-09-18", + "last_updated": "2025-11-25", "cost": { - "input": 0.3, - "output": 0.9 + "input": 0.05, + "output": 0.05 }, "type": "chat" }, { - "id": "mistral-small-2503", - "name": "Mistral Small 3.1", - "display_name": "Mistral Small 3.1", + "id": "Qwen/Qwen3-Coder-30B-A3B-Instruct", + "name": "Qwen/Qwen3-Coder-30B-A3B-Instruct", + "display_name": "Qwen/Qwen3-Coder-30B-A3B-Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-09", - "release_date": "2025-03-01", - "last_updated": "2025-03-01", + "release_date": "2025-08-01", + "last_updated": "2025-11-25", "cost": { - "input": 0.1, - "output": 0.3 - }, - "type": "chat" + "input": 0.07, + "output": 0.28 + } }, { - "id": "gpt-3.5-turbo-1106", - "name": "GPT-3.5 Turbo 1106", - "display_name": "GPT-3.5 Turbo 1106", + "id": "Qwen/Qwen2.5-72B-Instruct", + "name": "Qwen/Qwen2.5-72B-Instruct", + "display_name": "Qwen/Qwen2.5-72B-Instruct", "modalities": { "input": [ "text" @@ -29326,38 +28857,28 @@ ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 131072, + "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2021-08", - "release_date": "2023-11-06", - "last_updated": "2023-11-06", + "release_date": "2024-09-18", + "last_updated": "2025-11-25", "cost": { - "input": 1, - "output": 2 + "input": 0.59, + "output": 0.59 }, "type": "chat" - } - ] - }, - "baseten": { - "id": "baseten", - "name": "Baseten", - "display_name": "Baseten", - "api": "https://inference.baseten.co/v1", - "doc": "https://docs.baseten.co/development/model-apis/overview", - "models": [ + }, { - "id": "moonshotai/Kimi-K2-Instruct-0905", - "name": "Kimi K2 Instruct 0905", - "display_name": "Kimi K2 Instruct 0905", + "id": "Qwen/Qwen2.5-72B-Instruct-128K", + "name": "Qwen/Qwen2.5-72B-Instruct-128K", + "display_name": "Qwen/Qwen2.5-72B-Instruct-128K", "modalities": { "input": [ "text" @@ -29367,8 +28888,8 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -29376,20 +28897,19 @@ "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-08", - "release_date": "2025-09-05", - "last_updated": "2025-09-05", + "open_weights": false, + "release_date": "2024-09-18", + "last_updated": "2025-11-25", "cost": { - "input": 0.6, - "output": 2.5 + "input": 0.59, + "output": 0.59 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2-Thinking", - "name": "Kimi K2 Thinking", - "display_name": "Kimi K2 Thinking", + "id": "Qwen/Qwen2.5-32B-Instruct", + "name": "Qwen/Qwen2.5-32B-Instruct", + "display_name": "Qwen/Qwen2.5-32B-Instruct", "modalities": { "input": [ "text" @@ -29399,30 +28919,28 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-11-06", - "last_updated": "2025-11-06", + "open_weights": false, + "release_date": "2024-09-19", + "last_updated": "2025-11-25", "cost": { - "input": 0.6, - "output": 2.5 + "input": 0.18, + "output": 0.18 }, "type": "chat" }, { - "id": "Qwen/Qwen3-Coder-480B-A35B-Instruct", - "name": "Qwen3 Coder 480B A35B Instruct", - "display_name": "Qwen3 Coder 480B A35B Instruct", + "id": "Qwen/Qwen2.5-Coder-32B-Instruct", + "name": "Qwen/Qwen2.5-Coder-32B-Instruct", + "display_name": "Qwen/Qwen2.5-Coder-32B-Instruct", "modalities": { "input": [ "text" @@ -29432,8 +28950,8 @@ ] }, "limit": { - "context": 262144, - "output": 66536 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -29441,20 +28959,18 @@ "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-23", - "last_updated": "2025-07-23", + "open_weights": false, + "release_date": "2024-11-11", + "last_updated": "2025-11-25", "cost": { - "input": 0.38, - "output": 1.53 - }, - "type": "chat" + "input": 0.18, + "output": 0.18 + } }, { - "id": "zai-org/GLM-4.7", - "name": "GLM-4.7", - "display_name": "GLM-4.7", + "id": "Qwen/Qwen3-235B-A22B-Instruct-2507", + "name": "Qwen/Qwen3-235B-A22B-Instruct-2507", + "display_name": "Qwen/Qwen3-235B-A22B-Instruct-2507", "modalities": { "input": [ "text" @@ -29464,62 +28980,60 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-22", - "last_updated": "2025-12-22", + "open_weights": false, + "release_date": "2025-07-23", + "last_updated": "2025-11-25", "cost": { - "input": 0.6, - "output": 2.2 + "input": 0.09, + "output": 0.6 }, "type": "chat" }, { - "id": "zai-org/GLM-4.6", - "name": "GLM 4.6", - "display_name": "GLM 4.6", + "id": "Qwen/Qwen3-VL-8B-Thinking", + "name": "Qwen/Qwen3-VL-8B-Thinking", + "display_name": "Qwen/Qwen3-VL-8B-Thinking", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 200000 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-08-31", - "release_date": "2025-09-16", - "last_updated": "2025-09-16", + "attachment": true, + "open_weights": false, + "release_date": "2025-10-15", + "last_updated": "2025-11-25", "cost": { - "input": 0.6, - "output": 2.2 - }, - "type": "chat" + "input": 0.18, + "output": 2 + } }, { - "id": "deepseek-ai/DeepSeek-V3.2", - "name": "DeepSeek V3.2", - "display_name": "DeepSeek V3.2", + "id": "Qwen/Qwen3-Omni-30B-A3B-Instruct", + "name": "Qwen/Qwen3-Omni-30B-A3B-Instruct", + "display_name": "Qwen/Qwen3-Omni-30B-A3B-Instruct", "modalities": { "input": [ "text" @@ -29529,38 +29043,28 @@ ] }, "limit": { - "context": 163800, - "output": 131100 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-10", - "release_date": "2025-12-01", - "last_updated": "2025-12-01", + "attachment": true, + "open_weights": false, + "release_date": "2025-10-04", + "last_updated": "2025-11-25", "cost": { - "input": 0.3, - "output": 0.45 + "input": 0.1, + "output": 0.4 }, "type": "chat" - } - ] - }, - "siliconflow-com": { - "id": "siliconflow-com", - "name": "SiliconFlow", - "display_name": "SiliconFlow", - "api": "https://api.siliconflow.com/v1", - "doc": "https://cloud.siliconflow.com/models", - "models": [ + }, { - "id": "inclusionAI/Ling-mini-2.0", - "name": "inclusionAI/Ling-mini-2.0", - "display_name": "inclusionAI/Ling-mini-2.0", + "id": "Qwen/Qwen3-8B", + "name": "Qwen/Qwen3-8B", + "display_name": "Qwen/Qwen3-8B", "modalities": { "input": [ "text" @@ -29570,8 +29074,8 @@ ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -29580,18 +29084,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-09-10", + "release_date": "2025-04-30", "last_updated": "2025-11-25", "cost": { - "input": 0.07, - "output": 0.28 + "input": 0.06, + "output": 0.06 }, "type": "chat" }, { - "id": "inclusionAI/Ling-flash-2.0", - "name": "inclusionAI/Ling-flash-2.0", - "display_name": "inclusionAI/Ling-flash-2.0", + "id": "Qwen/Qwen3-Omni-30B-A3B-Captioner", + "name": "Qwen/Qwen3-Omni-30B-A3B-Captioner", + "display_name": "Qwen/Qwen3-Omni-30B-A3B-Captioner", "modalities": { "input": [ "text" @@ -29601,28 +29105,28 @@ ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-09-18", + "release_date": "2025-10-04", "last_updated": "2025-11-25", "cost": { - "input": 0.14, - "output": 0.57 + "input": 0.1, + "output": 0.4 }, "type": "chat" }, { - "id": "inclusionAI/Ring-flash-2.0", - "name": "inclusionAI/Ring-flash-2.0", - "display_name": "inclusionAI/Ring-flash-2.0", + "id": "Qwen/Qwen2.5-VL-32B-Instruct", + "name": "Qwen/Qwen2.5-VL-32B-Instruct", + "display_name": "Qwen/Qwen2.5-VL-32B-Instruct", "modalities": { "input": [ "text" @@ -29632,29 +29136,28 @@ ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-09-29", + "release_date": "2025-03-24", "last_updated": "2025-11-25", "cost": { - "input": 0.14, - "output": 0.57 + "input": 0.27, + "output": 0.27 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2-Instruct", - "name": "moonshotai/Kimi-K2-Instruct", - "display_name": "moonshotai/Kimi-K2-Instruct", + "id": "Qwen/Qwen3-14B", + "name": "Qwen/Qwen3-14B", + "display_name": "Qwen/Qwen3-14B", "modalities": { "input": [ "text" @@ -29664,8 +29167,8 @@ ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -29674,18 +29177,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-07-13", + "release_date": "2025-04-30", "last_updated": "2025-11-25", "cost": { - "input": 0.58, - "output": 2.29 + "input": 0.07, + "output": 0.28 }, "type": "chat" }, { - "id": "moonshotai/Kimi-Dev-72B", - "name": "moonshotai/Kimi-Dev-72B", - "display_name": "moonshotai/Kimi-Dev-72B", + "id": "Qwen/Qwen3-VL-30B-A3B-Instruct", + "name": "Qwen/Qwen3-VL-30B-A3B-Instruct", + "display_name": "Qwen/Qwen3-VL-30B-A3B-Instruct", "modalities": { "input": [ "text" @@ -29695,28 +29198,28 @@ ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-06-19", + "release_date": "2025-10-05", "last_updated": "2025-11-25", "cost": { "input": 0.29, - "output": 1.15 + "output": 1 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2-Instruct-0905", - "name": "moonshotai/Kimi-K2-Instruct-0905", - "display_name": "moonshotai/Kimi-K2-Instruct-0905", + "id": "Qwen/Qwen3-30B-A3B-Thinking-2507", + "name": "Qwen/Qwen3-30B-A3B-Thinking-2507", + "display_name": "Qwen/Qwen3-30B-A3B-Thinking-2507", "modalities": { "input": [ "text" @@ -29726,28 +29229,29 @@ ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "release_date": "2025-09-08", + "release_date": "2025-07-31", "last_updated": "2025-11-25", "cost": { - "input": 0.4, - "output": 2 + "input": 0.09, + "output": 0.3 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2-Thinking", - "name": "moonshotai/Kimi-K2-Thinking", - "display_name": "moonshotai/Kimi-K2-Thinking", + "id": "Qwen/Qwen3-30B-A3B", + "name": "Qwen/Qwen3-30B-A3B", + "display_name": "Qwen/Qwen3-30B-A3B", "modalities": { "input": [ "text" @@ -29757,29 +29261,28 @@ ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-11-07", + "release_date": "2025-04-30", "last_updated": "2025-11-25", "cost": { - "input": 0.55, - "output": 2.5 + "input": 0.09, + "output": 0.45 }, "type": "chat" }, { - "id": "tencent/Hunyuan-MT-7B", - "name": "tencent/Hunyuan-MT-7B", - "display_name": "tencent/Hunyuan-MT-7B", + "id": "zai-org/GLM-4.5-Air", + "name": "zai-org/GLM-4.5-Air", + "display_name": "zai-org/GLM-4.5-Air", "modalities": { "input": [ "text" @@ -29789,8 +29292,8 @@ ] }, "limit": { - "context": 33000, - "output": 33000 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -29799,18 +29302,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-09-18", + "release_date": "2025-07-28", "last_updated": "2025-11-25", "cost": { - "input": 0, - "output": 0 + "input": 0.14, + "output": 0.86 }, "type": "chat" }, { - "id": "tencent/Hunyuan-A13B-Instruct", - "name": "tencent/Hunyuan-A13B-Instruct", - "display_name": "tencent/Hunyuan-A13B-Instruct", + "id": "zai-org/GLM-4.5V", + "name": "zai-org/GLM-4.5V", + "display_name": "zai-org/GLM-4.5V", "modalities": { "input": [ "text" @@ -29820,28 +29323,28 @@ ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-06-30", + "release_date": "2025-08-13", "last_updated": "2025-11-25", "cost": { "input": 0.14, - "output": 0.57 + "output": 0.86 }, "type": "chat" }, { - "id": "MiniMaxAI/MiniMax-M2", - "name": "MiniMaxAI/MiniMax-M2", - "display_name": "MiniMaxAI/MiniMax-M2", + "id": "zai-org/GLM-4.6", + "name": "zai-org/GLM-4.6", + "display_name": "zai-org/GLM-4.6", "modalities": { "input": [ "text" @@ -29851,8 +29354,8 @@ ] }, "limit": { - "context": 197000, - "output": 131000 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -29861,21 +29364,22 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-10-28", + "release_date": "2025-10-04", "last_updated": "2025-11-25", "cost": { - "input": 0.3, - "output": 1.2 + "input": 0.5, + "output": 1.9 }, "type": "chat" }, { - "id": "MiniMaxAI/MiniMax-M1-80k", - "name": "MiniMaxAI/MiniMax-M1-80k", - "display_name": "MiniMaxAI/MiniMax-M1-80k", + "id": "zai-org/GLM-4.6V", + "name": "zai-org/GLM-4.6V", + "display_name": "zai-org/GLM-4.6V", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -29891,20 +29395,19 @@ "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-06-17", - "last_updated": "2025-11-25", + "release_date": "2025-12-07", + "last_updated": "2025-12-07", "cost": { - "input": 0.55, - "output": 2.2 - }, - "type": "chat" + "input": 0.3, + "output": 0.9 + } }, { - "id": "THUDM/GLM-4-32B-0414", - "name": "THUDM/GLM-4-32B-0414", - "display_name": "THUDM/GLM-4-32B-0414", + "id": "deepseek-ai/DeepSeek-V3", + "name": "deepseek-ai/DeepSeek-V3", + "display_name": "deepseek-ai/DeepSeek-V3", "modalities": { "input": [ "text" @@ -29914,8 +29417,8 @@ ] }, "limit": { - "context": 33000, - "output": 33000 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -29924,30 +29427,29 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-04-18", + "release_date": "2024-12-26", "last_updated": "2025-11-25", "cost": { - "input": 0.27, - "output": 0.27 + "input": 0.25, + "output": 1 }, "type": "chat" }, { - "id": "THUDM/GLM-4.1V-9B-Thinking", - "name": "THUDM/GLM-4.1V-9B-Thinking", - "display_name": "THUDM/GLM-4.1V-9B-Thinking", + "id": "deepseek-ai/DeepSeek-V3.2", + "name": "deepseek-ai/DeepSeek-V3.2", + "display_name": "deepseek-ai/DeepSeek-V3.2", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 66000, - "output": 66000 + "context": 164000, + "output": 164000 }, "temperature": true, "tool_call": true, @@ -29955,20 +29457,19 @@ "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-07-04", - "last_updated": "2025-11-25", + "release_date": "2025-12-03", + "last_updated": "2025-12-03", "cost": { - "input": 0.035, - "output": 0.14 - }, - "type": "chat" + "input": 0.27, + "output": 0.42 + } }, { - "id": "THUDM/GLM-Z1-9B-0414", - "name": "THUDM/GLM-Z1-9B-0414", - "display_name": "THUDM/GLM-Z1-9B-0414", + "id": "deepseek-ai/DeepSeek-R1-Distill-Qwen-7B", + "name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-7B", + "display_name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-7B", "modalities": { "input": [ "text" @@ -29978,8 +29479,8 @@ ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -29989,18 +29490,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-04-18", + "release_date": "2025-01-20", "last_updated": "2025-11-25", "cost": { - "input": 0.086, - "output": 0.086 + "input": 0.05, + "output": 0.05 }, "type": "chat" }, { - "id": "THUDM/GLM-4-9B-0414", - "name": "THUDM/GLM-4-9B-0414", - "display_name": "THUDM/GLM-4-9B-0414", + "id": "deepseek-ai/DeepSeek-V3.1-Terminus", + "name": "deepseek-ai/DeepSeek-V3.1-Terminus", + "display_name": "deepseek-ai/DeepSeek-V3.1-Terminus", "modalities": { "input": [ "text" @@ -30010,28 +29511,29 @@ ] }, "limit": { - "context": 33000, - "output": 33000 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "release_date": "2025-04-18", + "release_date": "2025-09-29", "last_updated": "2025-11-25", "cost": { - "input": 0.086, - "output": 0.086 + "input": 0.27, + "output": 1 }, "type": "chat" }, { - "id": "THUDM/GLM-Z1-32B-0414", - "name": "THUDM/GLM-Z1-32B-0414", - "display_name": "THUDM/GLM-Z1-32B-0414", + "id": "deepseek-ai/DeepSeek-R1-Distill-Qwen-14B", + "name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-14B", + "display_name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-14B", "modalities": { "input": [ "text" @@ -30041,8 +29543,8 @@ ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -30052,18 +29554,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-04-18", + "release_date": "2025-01-20", "last_updated": "2025-11-25", "cost": { - "input": 0.14, - "output": 0.57 + "input": 0.1, + "output": 0.1 }, "type": "chat" }, { - "id": "openai/gpt-oss-20b", - "name": "openai/gpt-oss-20b", - "display_name": "openai/gpt-oss-20b", + "id": "deepseek-ai/deepseek-vl2", + "name": "deepseek-ai/deepseek-vl2", + "display_name": "deepseek-ai/deepseek-vl2", "modalities": { "input": [ "text" @@ -30073,28 +29575,28 @@ ] }, "limit": { - "context": 131000, - "output": 8000 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-08-13", + "release_date": "2024-12-13", "last_updated": "2025-11-25", "cost": { - "input": 0.04, - "output": 0.18 + "input": 0.15, + "output": 0.15 }, "type": "chat" }, { - "id": "openai/gpt-oss-120b", - "name": "openai/gpt-oss-120b", - "display_name": "openai/gpt-oss-120b", + "id": "deepseek-ai/DeepSeek-R1-Distill-Qwen-32B", + "name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-32B", + "display_name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-32B", "modalities": { "input": [ "text" @@ -30104,8 +29606,8 @@ ] }, "limit": { - "context": 131000, - "output": 8000 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -30115,61 +29617,62 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-08-13", + "release_date": "2025-01-20", "last_updated": "2025-11-25", "cost": { - "input": 0.05, - "output": 0.45 + "input": 0.18, + "output": 0.18 }, "type": "chat" }, { - "id": "stepfun-ai/step3", - "name": "stepfun-ai/step3", - "display_name": "stepfun-ai/step3", + "id": "deepseek-ai/DeepSeek-R1", + "name": "deepseek-ai/DeepSeek-R1", + "display_name": "deepseek-ai/DeepSeek-R1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 66000, - "output": 66000 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-08-06", + "release_date": "2025-05-28", "last_updated": "2025-11-25", "cost": { - "input": 0.57, - "output": 1.42 + "input": 0.5, + "output": 2.18 }, "type": "chat" }, { - "id": "nex-agi/DeepSeek-V3.1-Nex-N1", - "name": "nex-agi/DeepSeek-V3.1-Nex-N1", - "display_name": "nex-agi/DeepSeek-V3.1-Nex-N1", + "id": "Pro/moonshotai/Kimi-K2.5", + "name": "Pro/moonshotai/Kimi-K2.5", + "display_name": "Pro/moonshotai/Kimi-K2.5", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, @@ -30179,18 +29682,17 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-01-01", - "last_updated": "2025-11-25", + "release_date": "2026-01-27", + "last_updated": "2026-01-27", "cost": { - "input": 0.5, - "output": 2 - }, - "type": "chat" + "input": 0.55, + "output": 3 + } }, { - "id": "baidu/ERNIE-4.5-300B-A47B", - "name": "baidu/ERNIE-4.5-300B-A47B", - "display_name": "baidu/ERNIE-4.5-300B-A47B", + "id": "Pro/moonshotai/Kimi-K2-Instruct-0905", + "name": "Pro/moonshotai/Kimi-K2-Instruct-0905", + "display_name": "Pro/moonshotai/Kimi-K2-Instruct-0905", "modalities": { "input": [ "text" @@ -30200,8 +29702,8 @@ ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -30210,18 +29712,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-07-02", + "release_date": "2025-09-08", "last_updated": "2025-11-25", "cost": { - "input": 0.28, - "output": 1.1 + "input": 0.4, + "output": 2 }, "type": "chat" }, { - "id": "z-ai/GLM-4.5", - "name": "z-ai/GLM-4.5", - "display_name": "z-ai/GLM-4.5", + "id": "Pro/moonshotai/Kimi-K2-Thinking", + "name": "Pro/moonshotai/Kimi-K2-Thinking", + "display_name": "Pro/moonshotai/Kimi-K2-Thinking", "modalities": { "input": [ "text" @@ -30231,28 +29733,28 @@ ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "release_date": "2025-07-28", + "release_date": "2025-11-07", "last_updated": "2025-11-25", "cost": { - "input": 0.4, - "output": 2 - }, - "type": "chat" + "input": 0.55, + "output": 2.5 + } }, { - "id": "z-ai/GLM-4.5-Air", - "name": "z-ai/GLM-4.5-Air", - "display_name": "z-ai/GLM-4.5-Air", + "id": "Pro/MiniMaxAI/MiniMax-M2.1", + "name": "Pro/MiniMaxAI/MiniMax-M2.1", + "display_name": "Pro/MiniMaxAI/MiniMax-M2.1", "modalities": { "input": [ "text" @@ -30262,7 +29764,7 @@ ] }, "limit": { - "context": 131000, + "context": 197000, "output": 131000 }, "temperature": true, @@ -30272,18 +29774,17 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-07-28", - "last_updated": "2025-11-25", + "release_date": "2025-12-23", + "last_updated": "2025-12-23", "cost": { - "input": 0.14, - "output": 0.86 - }, - "type": "chat" + "input": 0.3, + "output": 1.2 + } }, { - "id": "ByteDance-Seed/Seed-OSS-36B-Instruct", - "name": "ByteDance-Seed/Seed-OSS-36B-Instruct", - "display_name": "ByteDance-Seed/Seed-OSS-36B-Instruct", + "id": "Pro/zai-org/GLM-4.7", + "name": "Pro/zai-org/GLM-4.7", + "display_name": "Pro/zai-org/GLM-4.7", "modalities": { "input": [ "text" @@ -30293,28 +29794,28 @@ ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 205000, + "output": 205000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "release_date": "2025-09-04", - "last_updated": "2025-11-25", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "cost": { - "input": 0.21, - "output": 0.57 - }, - "type": "chat" + "input": 0.6, + "output": 2.2 + } }, { - "id": "meta-llama/Meta-Llama-3.1-8B-Instruct", - "name": "meta-llama/Meta-Llama-3.1-8B-Instruct", - "display_name": "meta-llama/Meta-Llama-3.1-8B-Instruct", + "id": "Pro/deepseek-ai/DeepSeek-R1", + "name": "Pro/deepseek-ai/DeepSeek-R1", + "display_name": "Pro/deepseek-ai/DeepSeek-R1", "modalities": { "input": [ "text" @@ -30324,28 +29825,29 @@ ] }, "limit": { - "context": 33000, - "output": 4000 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "release_date": "2025-04-23", + "release_date": "2025-05-28", "last_updated": "2025-11-25", "cost": { - "input": 0.06, - "output": 0.06 + "input": 0.5, + "output": 2.18 }, "type": "chat" }, { - "id": "Qwen/Qwen3-30B-A3B", - "name": "Qwen/Qwen3-30B-A3B", - "display_name": "Qwen/Qwen3-30B-A3B", + "id": "Pro/deepseek-ai/DeepSeek-V3.1-Terminus", + "name": "Pro/deepseek-ai/DeepSeek-V3.1-Terminus", + "display_name": "Pro/deepseek-ai/DeepSeek-V3.1-Terminus", "modalities": { "input": [ "text" @@ -30355,28 +29857,29 @@ ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "release_date": "2025-04-30", + "release_date": "2025-09-29", "last_updated": "2025-11-25", "cost": { - "input": 0.09, - "output": 0.45 + "input": 0.27, + "output": 1 }, "type": "chat" }, { - "id": "Qwen/Qwen3-30B-A3B-Thinking-2507", - "name": "Qwen/Qwen3-30B-A3B-Thinking-2507", - "display_name": "Qwen/Qwen3-30B-A3B-Thinking-2507", + "id": "Pro/deepseek-ai/DeepSeek-V3.2", + "name": "Pro/deepseek-ai/DeepSeek-V3.2", + "display_name": "Pro/deepseek-ai/DeepSeek-V3.2", "modalities": { "input": [ "text" @@ -30386,8 +29889,8 @@ ] }, "limit": { - "context": 262000, - "output": 131000 + "context": 164000, + "output": 164000 }, "temperature": true, "tool_call": true, @@ -30397,50 +29900,48 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-07-31", - "last_updated": "2025-11-25", + "release_date": "2025-12-03", + "last_updated": "2025-12-03", "cost": { - "input": 0.09, - "output": 0.3 - }, - "type": "chat" + "input": 0.27, + "output": 0.42 + } }, { - "id": "Qwen/Qwen3-VL-30B-A3B-Instruct", - "name": "Qwen/Qwen3-VL-30B-A3B-Instruct", - "display_name": "Qwen/Qwen3-VL-30B-A3B-Instruct", + "id": "Pro/deepseek-ai/DeepSeek-V3", + "name": "Pro/deepseek-ai/DeepSeek-V3", + "display_name": "Pro/deepseek-ai/DeepSeek-V3", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-10-05", + "release_date": "2024-12-26", "last_updated": "2025-11-25", "cost": { - "input": 0.29, + "input": 0.25, "output": 1 }, "type": "chat" }, { - "id": "Qwen/Qwen3-14B", - "name": "Qwen/Qwen3-14B", - "display_name": "Qwen/Qwen3-14B", + "id": "deepseek-ai/DeepSeek-V3.2-Exp", + "name": "deepseek-ai/DeepSeek-V3.2-Exp", + "display_name": "deepseek-ai/DeepSeek-V3.2-Exp", "modalities": { "input": [ "text" @@ -30450,91 +29951,64 @@ ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 131072, + "output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "release_date": "2025-04-30", - "last_updated": "2025-11-25", - "cost": { - "input": 0.07, - "output": 0.28 - }, "type": "chat" }, { - "id": "Qwen/Qwen2.5-VL-32B-Instruct", - "name": "Qwen/Qwen2.5-VL-32B-Instruct", - "display_name": "Qwen/Qwen2.5-VL-32B-Instruct", + "id": "Pro/deepseek-ai/DeepSeek-V3.2-Exp", + "name": "Pro/deepseek-ai/DeepSeek-V3.2-Exp", + "display_name": "Pro/deepseek-ai/DeepSeek-V3.2-Exp", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 131072, + "output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-03-24", - "last_updated": "2025-11-25", - "cost": { - "input": 0.27, - "output": 0.27 - }, "type": "chat" }, { - "id": "Qwen/Qwen3-Omni-30B-A3B-Captioner", - "name": "Qwen/Qwen3-Omni-30B-A3B-Captioner", - "display_name": "Qwen/Qwen3-Omni-30B-A3B-Captioner", + "id": "inclusionAI/Ring-1T", + "name": "inclusionAI/Ring-1T", + "display_name": "inclusionAI/Ring-1T", "modalities": { "input": [ - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 66000, - "output": 66000 + "context": 131072, + "output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": false, - "release_date": "2025-10-04", - "last_updated": "2025-11-25", - "cost": { - "input": 0.1, - "output": 0.4 + "supported": true, + "default": true }, "type": "chat" }, { - "id": "Qwen/Qwen3-8B", - "name": "Qwen/Qwen3-8B", - "display_name": "Qwen/Qwen3-8B", + "id": "inclusionAI/Ling-1T", + "name": "inclusionAI/Ling-1T", + "display_name": "inclusionAI/Ling-1T", "modalities": { "input": [ "text" @@ -30544,156 +30018,107 @@ ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 131072, + "output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "release_date": "2025-04-30", - "last_updated": "2025-11-25", - "cost": { - "input": 0.06, - "output": 0.06 - }, "type": "chat" }, { - "id": "Qwen/Qwen3-Omni-30B-A3B-Instruct", - "name": "Qwen/Qwen3-Omni-30B-A3B-Instruct", - "display_name": "Qwen/Qwen3-Omni-30B-A3B-Instruct", + "id": "Qwen/Qwen-Image-Edit-2509", + "name": "Qwen/Qwen-Image-Edit-2509", + "display_name": "Qwen/Qwen-Image-Edit-2509", "modalities": { "input": [ - "text", "image", - "audio" + "text" ], "output": [ - "text" + "image" ] }, - "limit": { - "context": 66000, - "output": 66000 - }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false - }, - "attachment": true, - "open_weights": false, - "release_date": "2025-10-04", - "last_updated": "2025-11-25", - "cost": { - "input": 0.1, - "output": 0.4 - }, - "type": "chat" + } }, { - "id": "Qwen/Qwen3-VL-8B-Thinking", - "name": "Qwen/Qwen3-VL-8B-Thinking", - "display_name": "Qwen/Qwen3-VL-8B-Thinking", + "id": "Qwen/Qwen-Image-Edit", + "name": "Qwen/Qwen-Image-Edit", + "display_name": "Qwen/Qwen-Image-Edit", "modalities": { "input": [ - "text", - "image" + "image", + "text" ], "output": [ - "text" + "image" ] }, - "limit": { - "context": 262000, - "output": 262000 - }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "attachment": true, - "open_weights": false, - "release_date": "2025-10-15", - "last_updated": "2025-11-25", - "cost": { - "input": 0.18, - "output": 2 - }, - "type": "chat" + "supported": false + } }, { - "id": "Qwen/Qwen3-235B-A22B-Instruct-2507", - "name": "Qwen/Qwen3-235B-A22B-Instruct-2507", - "display_name": "Qwen/Qwen3-235B-A22B-Instruct-2507", + "id": "Qwen/Qwen-Image", + "name": "Qwen/Qwen-Image", + "display_name": "Qwen/Qwen-Image", "modalities": { "input": [ "text" ], "output": [ - "text" + "image" ] }, - "limit": { - "context": 262000, - "output": 262000 - }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false - }, - "attachment": false, - "open_weights": false, - "release_date": "2025-07-23", - "last_updated": "2025-11-25", - "cost": { - "input": 0.09, - "output": 0.6 - }, - "type": "chat" + } }, { - "id": "Qwen/Qwen2.5-Coder-32B-Instruct", - "name": "Qwen/Qwen2.5-Coder-32B-Instruct", - "display_name": "Qwen/Qwen2.5-Coder-32B-Instruct", + "id": "Wan-AI/Wan2.2-I2V-A14B", + "name": "Wan-AI/Wan2.2-I2V-A14B", + "display_name": "Wan-AI/Wan2.2-I2V-A14B", "modalities": { "input": [ + "image", "text" ], "output": [ - "text" + "video" ] }, - "limit": { - "context": 33000, - "output": 4000 - }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false + } + }, + { + "id": "Wan-AI/Wan2.2-T2V-A14B", + "name": "Wan-AI/Wan2.2-T2V-A14B", + "display_name": "Wan-AI/Wan2.2-T2V-A14B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "video" + ] }, - "attachment": false, - "open_weights": false, - "release_date": "2024-11-11", - "last_updated": "2025-11-25", - "cost": { - "input": 0.18, - "output": 0.18 - }, - "type": "chat" + "tool_call": false, + "reasoning": { + "supported": false + } }, { - "id": "Qwen/Qwen2.5-32B-Instruct", - "name": "Qwen/Qwen2.5-32B-Instruct", - "display_name": "Qwen/Qwen2.5-32B-Instruct", + "id": "zai-org/GLM-4.5", + "name": "zai-org/GLM-4.5", + "display_name": "zai-org/GLM-4.5", "modalities": { "input": [ "text" @@ -30703,59 +30128,36 @@ ] }, "limit": { - "context": 33000, - "output": 4000 + "context": 131072, + "output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "release_date": "2024-09-19", - "last_updated": "2025-11-25", - "cost": { - "input": 0.18, - "output": 0.18 - }, "type": "chat" }, { - "id": "Qwen/Qwen2.5-72B-Instruct-128K", - "name": "Qwen/Qwen2.5-72B-Instruct-128K", - "display_name": "Qwen/Qwen2.5-72B-Instruct-128K", + "id": "TeleAI/TeleSpeechASR", + "name": "TeleAI/TeleSpeechASR", + "display_name": "TeleAI/TeleSpeechASR", "modalities": { "input": [ - "text" + "audio" ], "output": [ "text" ] }, - "limit": { - "context": 131000, - "output": 4000 - }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false - }, - "attachment": false, - "open_weights": false, - "release_date": "2024-09-18", - "last_updated": "2025-11-25", - "cost": { - "input": 0.59, - "output": 0.59 - }, - "type": "chat" + } }, { - "id": "Qwen/Qwen2.5-72B-Instruct", - "name": "Qwen/Qwen2.5-72B-Instruct", - "display_name": "Qwen/Qwen2.5-72B-Instruct", + "id": "Pro/THUDM/GLM-4.1V-9B-Thinking", + "name": "Pro/THUDM/GLM-4.1V-9B-Thinking", + "display_name": "Pro/THUDM/GLM-4.1V-9B-Thinking", "modalities": { "input": [ "text" @@ -30765,28 +30167,20 @@ ] }, "limit": { - "context": 33000, - "output": 4000 + "context": 131072, + "output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "release_date": "2024-09-18", - "last_updated": "2025-11-25", - "cost": { - "input": 0.59, - "output": 0.59 + "supported": true, + "default": true }, "type": "chat" }, { - "id": "Qwen/Qwen3-Coder-30B-A3B-Instruct", - "name": "Qwen/Qwen3-Coder-30B-A3B-Instruct", - "display_name": "Qwen/Qwen3-Coder-30B-A3B-Instruct", + "id": "Tongyi-Zhiwen/QwenLong-L1-32B", + "name": "Tongyi-Zhiwen/QwenLong-L1-32B", + "display_name": "Tongyi-Zhiwen/QwenLong-L1-32B", "modalities": { "input": [ "text" @@ -30796,28 +30190,20 @@ ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 131072, + "output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "release_date": "2025-08-01", - "last_updated": "2025-11-25", - "cost": { - "input": 0.07, - "output": 0.28 + "supported": true, + "default": true }, "type": "chat" }, { - "id": "Qwen/Qwen2.5-7B-Instruct", - "name": "Qwen/Qwen2.5-7B-Instruct", - "display_name": "Qwen/Qwen2.5-7B-Instruct", + "id": "deepseek-ai/DeepSeek-R1-0528-Qwen3-8B", + "name": "deepseek-ai/DeepSeek-R1-0528-Qwen3-8B", + "display_name": "deepseek-ai/DeepSeek-R1-0528-Qwen3-8B", "modalities": { "input": [ "text" @@ -30827,250 +30213,171 @@ ] }, "limit": { - "context": 33000, - "output": 4000 + "context": 131072, + "output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "release_date": "2024-09-18", - "last_updated": "2025-11-25", - "cost": { - "input": 0.05, - "output": 0.05 + "supported": true, + "default": true }, "type": "chat" }, { - "id": "Qwen/Qwen3-235B-A22B", - "name": "Qwen/Qwen3-235B-A22B", - "display_name": "Qwen/Qwen3-235B-A22B", + "id": "Qwen/Qwen3-Reranker-8B", + "name": "Qwen/Qwen3-Reranker-8B", + "display_name": "Qwen/Qwen3-Reranker-8B", "modalities": { "input": [ "text" ], "output": [ - "text" + "score" ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 8192, + "output": 2048 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false - }, - "attachment": false, - "open_weights": false, - "release_date": "2025-04-30", - "last_updated": "2025-11-25", - "cost": { - "input": 0.35, - "output": 1.42 - }, - "type": "chat" + } }, { - "id": "Qwen/Qwen2.5-VL-72B-Instruct", - "name": "Qwen/Qwen2.5-VL-72B-Instruct", - "display_name": "Qwen/Qwen2.5-VL-72B-Instruct", + "id": "Qwen/Qwen3-Embedding-8B", + "name": "Qwen/Qwen3-Embedding-8B", + "display_name": "Qwen/Qwen3-Embedding-8B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "text" + "embedding" ] }, "limit": { - "context": 131000, - "output": 4000 + "context": 8192, + "output": 2048 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-01-28", - "last_updated": "2025-11-25", - "cost": { - "input": 0.59, - "output": 0.59 - }, - "type": "chat" + "type": "embedding" }, { - "id": "Qwen/QwQ-32B", - "name": "Qwen/QwQ-32B", - "display_name": "Qwen/QwQ-32B", + "id": "Qwen/Qwen3-Reranker-4B", + "name": "Qwen/Qwen3-Reranker-4B", + "display_name": "Qwen/Qwen3-Reranker-4B", "modalities": { "input": [ "text" ], "output": [ - "text" + "score" ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 8192, + "output": 2048 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "attachment": false, - "open_weights": false, - "release_date": "2025-03-06", - "last_updated": "2025-11-25", - "cost": { - "input": 0.15, - "output": 0.58 - }, - "type": "chat" + "supported": false + } }, { - "id": "Qwen/Qwen2.5-VL-7B-Instruct", - "name": "Qwen/Qwen2.5-VL-7B-Instruct", - "display_name": "Qwen/Qwen2.5-VL-7B-Instruct", + "id": "Qwen/Qwen3-Embedding-4B", + "name": "Qwen/Qwen3-Embedding-4B", + "display_name": "Qwen/Qwen3-Embedding-4B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "text" + "embedding" ] }, "limit": { - "context": 33000, - "output": 4000 + "context": 8192, + "output": 2048 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-01-28", - "last_updated": "2025-11-25", - "cost": { - "input": 0.05, - "output": 0.05 - }, - "type": "chat" + "type": "embedding" }, { - "id": "Qwen/Qwen3-32B", - "name": "Qwen/Qwen3-32B", - "display_name": "Qwen/Qwen3-32B", + "id": "Qwen/Qwen3-Reranker-0.6B", + "name": "Qwen/Qwen3-Reranker-0.6B", + "display_name": "Qwen/Qwen3-Reranker-0.6B", "modalities": { "input": [ "text" ], "output": [ - "text" + "score" ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 8192, + "output": 2048 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false - }, - "attachment": false, - "open_weights": false, - "release_date": "2025-04-30", - "last_updated": "2025-11-25", - "cost": { - "input": 0.14, - "output": 0.57 - }, - "type": "chat" + } }, { - "id": "Qwen/Qwen3-VL-8B-Instruct", - "name": "Qwen/Qwen3-VL-8B-Instruct", - "display_name": "Qwen/Qwen3-VL-8B-Instruct", + "id": "Qwen/Qwen3-Embedding-0.6B", + "name": "Qwen/Qwen3-Embedding-0.6B", + "display_name": "Qwen/Qwen3-Embedding-0.6B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "text" + "embedding" ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 8192, + "output": 2048 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-10-15", - "last_updated": "2025-11-25", - "cost": { - "input": 0.18, - "output": 0.68 - }, - "type": "chat" + "type": "embedding" }, { - "id": "Qwen/Qwen3-VL-235B-A22B-Instruct", - "name": "Qwen/Qwen3-VL-235B-A22B-Instruct", - "display_name": "Qwen/Qwen3-VL-235B-A22B-Instruct", + "id": "Qwen/Qwen3-235B-A22B", + "name": "Qwen/Qwen3-235B-A22B", + "display_name": "Qwen/Qwen3-235B-A22B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 131072, + "output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-10-04", - "last_updated": "2025-11-25", - "cost": { - "input": 0.3, - "output": 1.5 - }, "type": "chat" }, { - "id": "Qwen/Qwen3-Coder-480B-A35B-Instruct", - "name": "Qwen/Qwen3-Coder-480B-A35B-Instruct", - "display_name": "Qwen/Qwen3-Coder-480B-A35B-Instruct", + "id": "Pro/Qwen/Qwen2.5-VL-7B-Instruct", + "name": "Pro/Qwen/Qwen2.5-VL-7B-Instruct", + "display_name": "Pro/Qwen/Qwen2.5-VL-7B-Instruct", "modalities": { "input": [ "text" @@ -31080,61 +30387,42 @@ ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 131072, + "output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "release_date": "2025-07-31", - "last_updated": "2025-11-25", - "cost": { - "input": 0.25, - "output": 1 - }, "type": "chat" }, { - "id": "Qwen/Qwen3-VL-235B-A22B-Thinking", - "name": "Qwen/Qwen3-VL-235B-A22B-Thinking", - "display_name": "Qwen/Qwen3-VL-235B-A22B-Thinking", + "id": "Qwen/QVQ-72B-Preview", + "name": "Qwen/QVQ-72B-Preview", + "display_name": "Qwen/QVQ-72B-Preview", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 131072, + "output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-10-04", - "last_updated": "2025-11-25", - "cost": { - "input": 0.45, - "output": 3.5 - }, "type": "chat" }, { - "id": "Qwen/Qwen3-30B-A3B-Instruct-2507", - "name": "Qwen/Qwen3-30B-A3B-Instruct-2507", - "display_name": "Qwen/Qwen3-30B-A3B-Instruct-2507", + "id": "deepseek-ai/DeepSeek-V2.5", + "name": "deepseek-ai/DeepSeek-V2.5", + "display_name": "deepseek-ai/DeepSeek-V2.5", "modalities": { "input": [ "text" @@ -31144,286 +30432,190 @@ ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 131072, + "output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "release_date": "2025-07-30", - "last_updated": "2025-11-25", - "cost": { - "input": 0.09, - "output": 0.3 - }, "type": "chat" }, { - "id": "Qwen/Qwen3-VL-30B-A3B-Thinking", - "name": "Qwen/Qwen3-VL-30B-A3B-Thinking", - "display_name": "Qwen/Qwen3-VL-30B-A3B-Thinking", + "id": "fnlp/MOSS-TTSD-v0.5", + "name": "fnlp/MOSS-TTSD-v0.5", + "display_name": "fnlp/MOSS-TTSD-v0.5", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "text" + "audio" ] }, - "limit": { - "context": 262000, - "output": 262000 - }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "attachment": true, - "open_weights": false, - "release_date": "2025-10-11", - "last_updated": "2025-11-25", - "cost": { - "input": 0.29, - "output": 1 + "supported": false + } + }, + { + "id": "FunAudioLLM/CosyVoice2-0.5B", + "name": "FunAudioLLM/CosyVoice2-0.5B", + "display_name": "FunAudioLLM/CosyVoice2-0.5B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "audio" + ] }, - "type": "chat" + "tool_call": false, + "reasoning": { + "supported": false + } }, { - "id": "Qwen/Qwen3-VL-32B-Thinking", - "name": "Qwen/Qwen3-VL-32B-Thinking", - "display_name": "Qwen/Qwen3-VL-32B-Thinking", + "id": "FunAudioLLM/SenseVoiceSmall", + "name": "FunAudioLLM/SenseVoiceSmall", + "display_name": "FunAudioLLM/SenseVoiceSmall", "modalities": { "input": [ - "text", - "image" + "audio" ], "output": [ "text" ] }, - "limit": { - "context": 262000, - "output": 262000 - }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "attachment": true, - "open_weights": false, - "release_date": "2025-10-21", - "last_updated": "2025-11-25", - "cost": { - "input": 0.2, - "output": 1.5 - }, - "type": "chat" + "supported": false + } }, { - "id": "Qwen/Qwen3-235B-A22B-Thinking-2507", - "name": "Qwen/Qwen3-235B-A22B-Thinking-2507", - "display_name": "Qwen/Qwen3-235B-A22B-Thinking-2507", + "id": "IndexTeam/IndexTTS-2", + "name": "IndexTeam/IndexTTS-2", + "display_name": "IndexTeam/IndexTTS-2", "modalities": { "input": [ "text" ], "output": [ - "text" + "audio" ] }, - "limit": { - "context": 262000, - "output": 262000 - }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "attachment": false, - "open_weights": false, - "release_date": "2025-07-28", - "last_updated": "2025-11-25", - "cost": { - "input": 0.13, - "output": 0.6 - }, - "type": "chat" + "supported": false + } }, { - "id": "Qwen/Qwen3-Omni-30B-A3B-Thinking", - "name": "Qwen/Qwen3-Omni-30B-A3B-Thinking", - "display_name": "Qwen/Qwen3-Omni-30B-A3B-Thinking", + "id": "BAAI/bge-m3", + "name": "BAAI/bge-m3", + "display_name": "BAAI/bge-m3", "modalities": { "input": [ - "text", - "image", - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 66000, - "output": 66000 + "context": 131072, + "output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "attachment": true, - "open_weights": false, - "release_date": "2025-10-04", - "last_updated": "2025-11-25", - "cost": { - "input": 0.1, - "output": 0.4 + "supported": false }, "type": "chat" }, { - "id": "Qwen/Qwen3-VL-32B-Instruct", - "name": "Qwen/Qwen3-VL-32B-Instruct", - "display_name": "Qwen/Qwen3-VL-32B-Instruct", + "id": "BAAI/bge-reranker-v2-m3", + "name": "BAAI/bge-reranker-v2-m3", + "display_name": "BAAI/bge-reranker-v2-m3", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "text" + "score" ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 8192, + "output": 2048 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false - }, - "attachment": true, - "open_weights": false, - "release_date": "2025-10-21", - "last_updated": "2025-11-25", - "cost": { - "input": 0.2, - "output": 0.6 - }, - "type": "chat" + } }, { - "id": "Qwen/Qwen3-Next-80B-A3B-Instruct", - "name": "Qwen/Qwen3-Next-80B-A3B-Instruct", - "display_name": "Qwen/Qwen3-Next-80B-A3B-Instruct", + "id": "netease-youdao/bce-embedding-base_v1", + "name": "netease-youdao/bce-embedding-base_v1", + "display_name": "netease-youdao/bce-embedding-base_v1", "modalities": { "input": [ "text" ], "output": [ - "text" + "embedding" ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 8192, + "output": 2048 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "release_date": "2025-09-18", - "last_updated": "2025-11-25", - "cost": { - "input": 0.14, - "output": 1.4 - }, - "type": "chat" + "type": "embedding" }, { - "id": "Qwen/Qwen2.5-14B-Instruct", - "name": "Qwen/Qwen2.5-14B-Instruct", - "display_name": "Qwen/Qwen2.5-14B-Instruct", + "id": "netease-youdao/bce-reranker-base_v1", + "name": "netease-youdao/bce-reranker-base_v1", + "display_name": "netease-youdao/bce-reranker-base_v1", "modalities": { "input": [ "text" ], "output": [ - "text" + "score" ] }, "limit": { - "context": 33000, - "output": 4000 + "context": 8192, + "output": 2048 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false - }, - "attachment": false, - "open_weights": false, - "release_date": "2024-09-18", - "last_updated": "2025-11-25", - "cost": { - "input": 0.1, - "output": 0.1 - }, - "type": "chat" + } }, { - "id": "Qwen/Qwen3-Next-80B-A3B-Thinking", - "name": "Qwen/Qwen3-Next-80B-A3B-Thinking", - "display_name": "Qwen/Qwen3-Next-80B-A3B-Thinking", + "id": "Kwai-Kolors/Kolors", + "name": "Kwai-Kolors/Kolors", + "display_name": "Kwai-Kolors/Kolors", "modalities": { "input": [ "text" ], "output": [ - "text" + "image" ] }, - "limit": { - "context": 262000, - "output": 262000 - }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "attachment": false, - "open_weights": false, - "release_date": "2025-09-25", - "last_updated": "2025-11-25", - "cost": { - "input": 0.14, - "output": 0.57 - }, - "type": "chat" + "supported": false + } }, { - "id": "zai-org/GLM-4.5", - "name": "zai-org/GLM-4.5", - "display_name": "zai-org/GLM-4.5", + "id": "Qwen/Qwen2-VL-72B-Instruct", + "name": "Qwen/Qwen2-VL-72B-Instruct", + "display_name": "Qwen/Qwen2-VL-72B-Instruct", "modalities": { "input": [ "text" @@ -31433,28 +30625,19 @@ ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 131072, + "output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "release_date": "2025-07-28", - "last_updated": "2025-11-25", - "cost": { - "input": 0.4, - "output": 2 - }, "type": "chat" }, { - "id": "zai-org/GLM-4.6", - "name": "zai-org/GLM-4.6", - "display_name": "zai-org/GLM-4.6", + "id": "Qwen/Qwen2.5-Coder-7B-Instruct", + "name": "Qwen/Qwen2.5-Coder-7B-Instruct", + "display_name": "Qwen/Qwen2.5-Coder-7B-Instruct", "modalities": { "input": [ "text" @@ -31464,60 +30647,40 @@ ] }, "limit": { - "context": 205000, - "output": 205000 + "context": 131072, + "output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": false - }, - "attachment": false, - "open_weights": false, - "release_date": "2025-10-04", - "last_updated": "2025-11-25", - "cost": { - "input": 0.5, - "output": 1.9 - }, - "type": "chat" + } }, { - "id": "zai-org/GLM-4.5V", - "name": "zai-org/GLM-4.5V", - "display_name": "zai-org/GLM-4.5V", + "id": "internlm/internlm2_5-7b-chat", + "name": "internlm/internlm2_5-7b-chat", + "display_name": "internlm/internlm2_5-7b-chat", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 66000, - "output": 66000 + "context": 131072, + "output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-08-13", - "last_updated": "2025-11-25", - "cost": { - "input": 0.14, - "output": 0.86 - }, "type": "chat" }, { - "id": "zai-org/GLM-4.5-Air", - "name": "zai-org/GLM-4.5-Air", - "display_name": "zai-org/GLM-4.5-Air", + "id": "Qwen/Qwen2-7B-Instruct", + "name": "Qwen/Qwen2-7B-Instruct", + "display_name": "Qwen/Qwen2-7B-Instruct", "modalities": { "input": [ "text" @@ -31527,28 +30690,19 @@ ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 131072, + "output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "release_date": "2025-07-28", - "last_updated": "2025-11-25", - "cost": { - "input": 0.14, - "output": 0.86 - }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-R1", - "name": "deepseek-ai/DeepSeek-R1", - "display_name": "deepseek-ai/DeepSeek-R1", + "id": "THUDM/glm-4-9b-chat", + "name": "THUDM/glm-4-9b-chat", + "display_name": "THUDM/glm-4-9b-chat", "modalities": { "input": [ "text" @@ -31558,29 +30712,19 @@ ] }, "limit": { - "context": 164000, - "output": 164000 + "context": 131072, + "output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "attachment": false, - "open_weights": false, - "release_date": "2025-05-28", - "last_updated": "2025-11-25", - "cost": { - "input": 0.5, - "output": 2.18 + "supported": false }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-R1-Distill-Qwen-32B", - "name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-32B", - "display_name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-32B", + "id": "BAAI/bge-large-en-v1.5", + "name": "BAAI/bge-large-en-v1.5", + "display_name": "BAAI/bge-large-en-v1.5", "modalities": { "input": [ "text" @@ -31590,61 +30734,41 @@ ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 131072, + "output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "attachment": false, - "open_weights": false, - "release_date": "2025-01-20", - "last_updated": "2025-11-25", - "cost": { - "input": 0.18, - "output": 0.18 + "supported": false }, "type": "chat" }, { - "id": "deepseek-ai/deepseek-vl2", - "name": "deepseek-ai/deepseek-vl2", - "display_name": "deepseek-ai/deepseek-vl2", + "id": "BAAI/bge-large-zh-v1.5", + "name": "BAAI/bge-large-zh-v1.5", + "display_name": "BAAI/bge-large-zh-v1.5", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 4000, - "output": 4000 + "context": 131072, + "output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2024-12-13", - "last_updated": "2025-11-25", - "cost": { - "input": 0.15, - "output": 0.15 - }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-R1-Distill-Qwen-14B", - "name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-14B", - "display_name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-14B", + "id": "LoRA/Qwen/Qwen2.5-32B-Instruct", + "name": "LoRA/Qwen/Qwen2.5-32B-Instruct", + "display_name": "LoRA/Qwen/Qwen2.5-32B-Instruct", "modalities": { "input": [ "text" @@ -31654,29 +30778,19 @@ ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 131072, + "output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "attachment": false, - "open_weights": false, - "release_date": "2025-01-20", - "last_updated": "2025-11-25", - "cost": { - "input": 0.1, - "output": 0.1 + "supported": false }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V3.2-Exp", - "name": "deepseek-ai/DeepSeek-V3.2-Exp", - "display_name": "deepseek-ai/DeepSeek-V3.2-Exp", + "id": "LoRA/Qwen/Qwen2.5-14B-Instruct", + "name": "LoRA/Qwen/Qwen2.5-14B-Instruct", + "display_name": "LoRA/Qwen/Qwen2.5-14B-Instruct", "modalities": { "input": [ "text" @@ -31686,29 +30800,19 @@ ] }, "limit": { - "context": 164000, - "output": 164000 + "context": 131072, + "output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "attachment": false, - "open_weights": false, - "release_date": "2025-10-10", - "last_updated": "2025-11-25", - "cost": { - "input": 0.27, - "output": 0.41 + "supported": false }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V3.1-Terminus", - "name": "deepseek-ai/DeepSeek-V3.1-Terminus", - "display_name": "deepseek-ai/DeepSeek-V3.1-Terminus", + "id": "Pro/deepseek-ai/DeepSeek-R1-Distill-Qwen-7B", + "name": "Pro/deepseek-ai/DeepSeek-R1-Distill-Qwen-7B", + "display_name": "Pro/deepseek-ai/DeepSeek-R1-Distill-Qwen-7B", "modalities": { "input": [ "text" @@ -31718,61 +30822,41 @@ ] }, "limit": { - "context": 164000, - "output": 164000 + "context": 131072, + "output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": false, - "release_date": "2025-09-29", - "last_updated": "2025-11-25", - "cost": { - "input": 0.27, - "output": 1 - }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-R1-Distill-Qwen-7B", - "name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-7B", - "display_name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-7B", + "id": "deepseek-ai/DeepSeek-OCR", + "name": "deepseek-ai/DeepSeek-OCR", + "display_name": "deepseek-ai/DeepSeek-OCR", "modalities": { "input": [ - "text" + "image" ], "output": [ "text" ] }, "limit": { - "context": 33000, - "output": 16000 + "context": 8192, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "attachment": false, - "open_weights": false, - "release_date": "2025-01-20", - "last_updated": "2025-11-25", - "cost": { - "input": 0.05, - "output": 0.05 - }, - "type": "chat" + "supported": false + } }, { - "id": "deepseek-ai/DeepSeek-V3", - "name": "deepseek-ai/DeepSeek-V3", - "display_name": "deepseek-ai/DeepSeek-V3", + "id": "Pro/Qwen/Qwen2.5-Coder-7B-Instruct", + "name": "Pro/Qwen/Qwen2.5-Coder-7B-Instruct", + "display_name": "Pro/Qwen/Qwen2.5-Coder-7B-Instruct", "modalities": { "input": [ "text" @@ -31782,28 +30866,18 @@ ] }, "limit": { - "context": 164000, - "output": 164000 + "context": 131072, + "output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": false - }, - "attachment": false, - "open_weights": false, - "release_date": "2024-12-26", - "last_updated": "2025-11-25", - "cost": { - "input": 0.25, - "output": 1 - }, - "type": "chat" + } }, { - "id": "deepseek-ai/DeepSeek-V3.1", - "name": "deepseek-ai/DeepSeek-V3.1", - "display_name": "deepseek-ai/DeepSeek-V3.1", + "id": "Pro/BAAI/bge-m3", + "name": "Pro/BAAI/bge-m3", + "display_name": "Pro/BAAI/bge-m3", "modalities": { "input": [ "text" @@ -31813,142 +30887,84 @@ ] }, "limit": { - "context": 164000, - "output": 164000 + "context": 131072, + "output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "attachment": false, - "open_weights": false, - "release_date": "2025-08-25", - "last_updated": "2025-11-25", - "cost": { - "input": 0.27, - "output": 1 + "supported": false }, "type": "chat" - } - ] - }, - "helicone": { - "id": "helicone", - "name": "Helicone", - "display_name": "Helicone", - "api": "https://ai-gateway.helicone.ai/v1", - "doc": "https://helicone.ai/models", - "models": [ + }, { - "id": "gpt-4.1-nano", - "name": "OpenAI GPT-4.1 Nano", - "display_name": "OpenAI GPT-4.1 Nano", + "id": "Pro/Qwen/Qwen2.5-7B-Instruct", + "name": "Pro/Qwen/Qwen2.5-7B-Instruct", + "display_name": "Pro/Qwen/Qwen2.5-7B-Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 131072, + "output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", - "cost": { - "input": 0.09999999999999999, - "output": 0.39999999999999997, - "cache_read": 0.024999999999999998 - }, "type": "chat" }, { - "id": "grok-4-fast-non-reasoning", - "name": "xAI Grok 4 Fast Non-Reasoning", - "display_name": "xAI Grok 4 Fast Non-Reasoning", + "id": "Pro/BAAI/bge-reranker-v2-m3", + "name": "Pro/BAAI/bge-reranker-v2-m3", + "display_name": "Pro/BAAI/bge-reranker-v2-m3", "modalities": { "input": [ - "text", - "image", - "audio" + "text" ], "output": [ - "text" + "score" ] }, "limit": { - "context": 2000000, - "output": 2000000 + "context": 8192, + "output": 2048 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false - }, - "attachment": false, - "open_weights": false, - "knowledge": "2025-09", - "release_date": "2025-09-19", - "last_updated": "2025-09-19", - "cost": { - "input": 0.19999999999999998, - "output": 0.5, - "cache_read": 0.049999999999999996 - }, - "type": "chat" + } }, { - "id": "qwen3-coder", - "name": "Qwen3 Coder 480B A35B Instruct Turbo", - "display_name": "Qwen3 Coder 480B A35B Instruct Turbo", + "id": "LoRA/Qwen/Qwen2.5-72B-Instruct", + "name": "LoRA/Qwen/Qwen2.5-72B-Instruct", + "display_name": "LoRA/Qwen/Qwen2.5-72B-Instruct", "modalities": { "input": [ - "text", - "image", - "audio", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 131072, + "output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-07-23", - "last_updated": "2025-07-23", - "cost": { - "input": 0.22, - "output": 0.95 - }, "type": "chat" }, { - "id": "deepseek-v3", - "name": "DeepSeek V3", - "display_name": "DeepSeek V3", + "id": "Pro/Qwen/Qwen2-7B-Instruct", + "name": "Pro/Qwen/Qwen2-7B-Instruct", + "display_name": "Pro/Qwen/Qwen2-7B-Instruct", "modalities": { "input": [ "text" @@ -31958,101 +30974,63 @@ ] }, "limit": { - "context": 128000, + "context": 131072, "output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-12", - "release_date": "2024-12-26", - "last_updated": "2024-12-26", - "cost": { - "input": 0.56, - "output": 1.68, - "cache_read": 0.07 - }, "type": "chat" }, { - "id": "claude-opus-4", - "name": "Anthropic: Claude Opus 4", - "display_name": "Anthropic: Claude Opus 4", + "id": "LoRA/Qwen/Qwen2.5-7B-Instruct", + "name": "LoRA/Qwen/Qwen2.5-7B-Instruct", + "display_name": "LoRA/Qwen/Qwen2.5-7B-Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 131072, + "output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "attachment": false, - "open_weights": false, - "knowledge": "2025-05", - "release_date": "2025-05-14", - "last_updated": "2025-05-14", - "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "supported": false }, "type": "chat" }, { - "id": "grok-4-fast-reasoning", - "name": "xAI: Grok 4 Fast Reasoning", - "display_name": "xAI: Grok 4 Fast Reasoning", + "id": "Pro/THUDM/glm-4-9b-chat", + "name": "Pro/THUDM/glm-4-9b-chat", + "display_name": "Pro/THUDM/glm-4-9b-chat", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 2000000 + "context": 131072, + "output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "attachment": false, - "open_weights": false, - "knowledge": "2025-09", - "release_date": "2025-09-01", - "last_updated": "2025-09-01", - "cost": { - "input": 0.19999999999999998, - "output": 0.5, - "cache_read": 0.049999999999999996 + "supported": false }, "type": "chat" }, { - "id": "llama-3.1-8b-instant", - "name": "Meta Llama 3.1 8B Instant", - "display_name": "Meta Llama 3.1 8B Instant", + "id": "THUDM/GLM-Z1-Rumination-32B-0414", + "name": "THUDM/GLM-Z1-Rumination-32B-0414", + "display_name": "THUDM/GLM-Z1-Rumination-32B-0414", "modalities": { "input": [ "text" @@ -32063,400 +31041,262 @@ }, "limit": { "context": 131072, - "output": 32678 + "output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-07", - "release_date": "2024-07-01", - "last_updated": "2024-07-01", - "cost": { - "input": 0.049999999999999996, - "output": 0.08 + "supported": true, + "default": true }, "type": "chat" }, { - "id": "claude-opus-4-1", - "name": "Anthropic: Claude Opus 4.1", - "display_name": "Anthropic: Claude Opus 4.1", + "id": "stabilityai/stable-diffusion-xl-base-1.0", + "name": "stabilityai/stable-diffusion-xl-base-1.0", + "display_name": "stabilityai/stable-diffusion-xl-base-1.0", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "text" + "image" ] }, - "limit": { - "context": 200000, - "output": 32000 - }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "attachment": false, - "open_weights": false, - "knowledge": "2025-08", - "release_date": "2025-08-05", - "last_updated": "2025-08-05", - "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 - }, - "type": "chat" + "supported": false + } }, { - "id": "grok-4", - "name": "xAI Grok 4", - "display_name": "xAI Grok 4", + "id": "black-forest-labs/FLUX.1-schnell", + "name": "black-forest-labs/FLUX.1-schnell", + "display_name": "black-forest-labs/FLUX.1-schnell", "modalities": { "input": [ "text" ], "output": [ - "text" + "image" ] }, - "limit": { - "context": 256000, - "output": 256000 - }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false - }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-07", - "release_date": "2024-07-09", - "last_updated": "2024-07-09", - "cost": { - "input": 3, - "output": 15, - "cache_read": 0.75 - }, - "type": "chat" + } }, { - "id": "qwen3-next-80b-a3b-instruct", - "name": "Qwen3 Next 80B A3B Instruct", - "display_name": "Qwen3 Next 80B A3B Instruct", + "id": "black-forest-labs/FLUX.1-dev", + "name": "black-forest-labs/FLUX.1-dev", + "display_name": "black-forest-labs/FLUX.1-dev", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ - "text" + "image" ] }, - "limit": { - "context": 262000, - "output": 16384 - }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false - }, - "attachment": false, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", - "cost": { - "input": 0.14, - "output": 1.4 - }, - "type": "chat" + } }, { - "id": "llama-4-maverick", - "name": "Meta Llama 4 Maverick 17B 128E", - "display_name": "Meta Llama 4 Maverick 17B 128E", + "id": "Pro/black-forest-labs/FLUX.1-schnell", + "name": "Pro/black-forest-labs/FLUX.1-schnell", + "display_name": "Pro/black-forest-labs/FLUX.1-schnell", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "text" + "image" ] }, - "limit": { - "context": 131072, - "output": 8192 - }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false - }, - "attachment": false, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", - "cost": { - "input": 0.15, - "output": 0.6 - }, - "type": "chat" + } }, { - "id": "llama-prompt-guard-2-86m", - "name": "Meta Llama Prompt Guard 2 86M", - "display_name": "Meta Llama Prompt Guard 2 86M", + "id": "stabilityai/stable-diffusion-3-5-large", + "name": "stabilityai/stable-diffusion-3-5-large", + "display_name": "stabilityai/stable-diffusion-3-5-large", "modalities": { "input": [ "text" ], "output": [ - "text" + "image" ] }, - "limit": { - "context": 512, - "output": 2 - }, - "temperature": true, "tool_call": false, "reasoning": { "supported": false - }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-10-01", - "last_updated": "2024-10-01", - "cost": { - "input": 0.01, - "output": 0.01 - }, - "type": "chat" + } }, { - "id": "grok-4-1-fast-reasoning", - "name": "xAI Grok 4.1 Fast Reasoning", - "display_name": "xAI Grok 4.1 Fast Reasoning", + "id": "fishaudio/fish-speech-1.4", + "name": "fishaudio/fish-speech-1.4", + "display_name": "fishaudio/fish-speech-1.4", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "text" + "audio" ] }, - "limit": { - "context": 2000000, - "output": 2000000 - }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "attachment": false, - "open_weights": false, - "knowledge": "2025-11", - "release_date": "2025-11-17", - "last_updated": "2025-11-17", - "cost": { - "input": 0.19999999999999998, - "output": 0.5, - "cache_read": 0.049999999999999996 - }, - "type": "chat" + "supported": false + } }, { - "id": "grok-code-fast-1", - "name": "xAI Grok Code Fast 1", - "display_name": "xAI Grok Code Fast 1", + "id": "RVC-Boss/GPT-SoVITS", + "name": "RVC-Boss/GPT-SoVITS", + "display_name": "RVC-Boss/GPT-SoVITS", "modalities": { "input": [ "text" ], "output": [ - "text" + "audio" ] }, - "limit": { - "context": 256000, - "output": 10000 - }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false - }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-08", - "release_date": "2024-08-25", - "last_updated": "2024-08-25", - "cost": { - "input": 0.19999999999999998, - "output": 1.5, - "cache_read": 0.02 - }, - "type": "chat" + } }, { - "id": "claude-4.5-haiku", - "name": "Anthropic: Claude 4.5 Haiku", - "display_name": "Anthropic: Claude 4.5 Haiku", + "id": "fishaudio/fish-speech-1.5", + "name": "fishaudio/fish-speech-1.5", + "display_name": "fishaudio/fish-speech-1.5", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "text" + "audio" ] }, - "limit": { - "context": 200000, - "output": 8192 - }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false - }, - "attachment": false, - "open_weights": false, - "knowledge": "2025-10", - "release_date": "2025-10-01", - "last_updated": "2025-10-01", - "cost": { - "input": 1, - "output": 5, - "cache_read": 0.09999999999999999, - "cache_write": 1.25 - }, - "type": "chat" + } }, { - "id": "llama-3.1-8b-instruct-turbo", - "name": "Meta Llama 3.1 8B Instruct Turbo", - "display_name": "Meta Llama 3.1 8B Instruct Turbo", + "id": "black-forest-labs/FLUX.1-pro", + "name": "black-forest-labs/FLUX.1-pro", + "display_name": "black-forest-labs/FLUX.1-pro", "modalities": { "input": [ "text" ], "output": [ - "text" + "image" ] }, - "limit": { - "context": 128000, - "output": 128000 - }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false - }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-07", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", - "cost": { - "input": 0.02, - "output": 0.03 - }, - "type": "chat" + } }, { - "id": "gpt-5.1-codex", - "name": "OpenAI: GPT-5.1 Codex", - "display_name": "OpenAI: GPT-5.1 Codex", + "id": "LoRA/black-forest-labs/FLUX.1-dev", + "name": "LoRA/black-forest-labs/FLUX.1-dev", + "display_name": "LoRA/black-forest-labs/FLUX.1-dev", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "text", "image" ] }, - "limit": { - "context": 400000, - "output": 128000 - }, - "temperature": false, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false - }, - "attachment": false, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", - "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.12500000000000003 - }, - "type": "chat" + } }, { - "id": "gpt-4.1-mini-2025-04-14", - "name": "OpenAI GPT-4.1 Mini", - "display_name": "OpenAI GPT-4.1 Mini", + "id": "SeedLLM/Seed-Rice-7B", + "name": "SeedLLM/Seed-Rice-7B", + "display_name": "SeedLLM/Seed-Rice-7B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 131072, + "output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "type": "chat" + } + ] + }, + "vivgrid": { + "id": "vivgrid", + "name": "Vivgrid", + "display_name": "Vivgrid", + "api": "https://api.vivgrid.com/v1", + "doc": "https://docs.vivgrid.com/models", + "models": [ + { + "id": "gemini-3-flash-preview", + "name": "Gemini 3 Flash Preview", + "display_name": "Gemini 3 Flash Preview", + "modalities": { + "input": [ + "text", + "image", + "video", + "audio", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1048576, + "output": 65536 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "knowledge": "2025-01", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", "cost": { - "input": 0.39999999999999997, - "output": 1.5999999999999999, - "cache_read": 0.09999999999999999 - }, - "type": "chat" + "input": 0.5, + "output": 3, + "cache_read": 0.05, + "context_over_200k": { + "input": 0.5, + "output": 3, + "cache_read": 0.05 + } + } }, { - "id": "llama-guard-4", - "name": "Meta Llama Guard 4 12B", - "display_name": "Meta Llama Guard 4 12B", + "id": "gpt-5.2-codex", + "name": "GPT-5.2 Codex", + "display_name": "GPT-5.2 Codex", "modalities": { "input": [ "text", @@ -32467,67 +31307,71 @@ ] }, "limit": { - "context": 131072, - "output": 1024 + "context": 400000, + "output": 128000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "knowledge": "2025-08-31", + "release_date": "2026-01-14", + "last_updated": "2026-01-14", "cost": { - "input": 0.21, - "output": 0.21 - }, - "type": "chat" + "input": 1.75, + "output": 14, + "cache_read": 0.175 + } }, { - "id": "llama-3.1-8b-instruct", - "name": "Meta Llama 3.1 8B Instruct", - "display_name": "Meta Llama 3.1 8B Instruct", + "id": "gpt-5.1-codex", + "name": "GPT-5.1 Codex", + "display_name": "GPT-5.1 Codex", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "knowledge": "2024-07", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.02, - "output": 0.049999999999999996 - }, - "type": "chat" + "input": 1.25, + "output": 10, + "cache_read": 0.125 + } }, { "id": "gemini-3-pro-preview", - "name": "Google Gemini 3 Pro Preview", - "display_name": "Google Gemini 3 Pro Preview", + "name": "Gemini 3 Pro Preview", + "display_name": "Gemini 3 Pro Preview", "modalities": { "input": [ "text", "image", + "video", "audio", - "video" + "pdf" ], "output": [ "text" @@ -32543,22 +31387,26 @@ "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-11", + "knowledge": "2025-01", "release_date": "2025-11-18", "last_updated": "2025-11-18", "cost": { "input": 2, "output": 12, - "cache_read": 0.19999999999999998 - }, - "type": "chat" + "cache_read": 0.2, + "context_over_200k": { + "input": 4, + "output": 18, + "cache_read": 0.4 + } + } }, { - "id": "gemini-2.5-flash", - "name": "Google Gemini 2.5 Flash", - "display_name": "Google Gemini 2.5 Flash", + "id": "gpt-5.1-codex-max", + "name": "GPT-5.1 Codex Max", + "display_name": "GPT-5.1 Codex Max", "modalities": { "input": [ "text", @@ -32569,10 +31417,10 @@ ] }, "limit": { - "context": 1048576, - "output": 65535 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -32580,55 +31428,58 @@ }, "attachment": false, "open_weights": false, - "knowledge": "2025-06", - "release_date": "2025-06-17", - "last_updated": "2025-06-17", + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.3, - "output": 2.5, - "cache_read": 0.075, - "cache_write": 0.3 - }, - "type": "chat" - }, + "input": 1.25, + "output": 10, + "cache_read": 0.125 + } + } + ] + }, + "chutes": { + "id": "chutes", + "name": "Chutes", + "display_name": "Chutes", + "api": "https://llm.chutes.ai/v1", + "doc": "https://llm.chutes.ai/v1/models", + "models": [ { - "id": "gpt-4.1-mini", - "name": "OpenAI GPT-4.1 Mini", - "display_name": "OpenAI GPT-4.1 Mini", + "id": "NousResearch/Hermes-4.3-36B", + "name": "Hermes 4.3 36B", + "display_name": "Hermes 4.3 36B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 32768, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", "cost": { - "input": 0.39999999999999997, - "output": 1.5999999999999999, - "cache_read": 0.09999999999999999 - }, - "type": "chat" + "input": 0.1, + "output": 0.39 + } }, { - "id": "deepseek-v3.1-terminus", - "name": "DeepSeek V3.1 Terminus", - "display_name": "DeepSeek V3.1 Terminus", + "id": "NousResearch/Hermes-4-70B", + "name": "Hermes 4 70B", + "display_name": "Hermes 4 70B", "modalities": { "input": [ "text" @@ -32638,8 +31489,8 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -32648,21 +31499,18 @@ "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2025-09", - "release_date": "2025-09-22", - "last_updated": "2025-09-22", + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", "cost": { - "input": 0.27, - "output": 1, - "cache_read": 0.21600000000000003 - }, - "type": "chat" + "input": 0.11, + "output": 0.38 + } }, { - "id": "llama-prompt-guard-2-22m", - "name": "Meta Llama Prompt Guard 2 22M", - "display_name": "Meta Llama Prompt Guard 2 22M", + "id": "NousResearch/Hermes-4-14B", + "name": "Hermes 4 14B", + "display_name": "Hermes 4 14B", "modalities": { "input": [ "text" @@ -32672,64 +31520,59 @@ ] }, "limit": { - "context": 512, - "output": 2 + "context": 40960, + "output": 40960 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-10-01", - "last_updated": "2024-10-01", + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", "cost": { "input": 0.01, - "output": 0.01 - }, - "type": "chat" + "output": 0.05 + } }, { - "id": "claude-3.5-sonnet-v2", - "name": "Anthropic: Claude 3.5 Sonnet v2", - "display_name": "Anthropic: Claude 3.5 Sonnet v2", + "id": "NousResearch/Hermes-4-405B-FP8-TEE", + "name": "Hermes 4 405B FP8 TEE", + "display_name": "Hermes 4 405B FP8 TEE", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 8192 + "context": 131072, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-10-22", - "last_updated": "2024-10-22", + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.30000000000000004, - "cache_write": 3.75 - }, - "type": "chat" + "input": 0.3, + "output": 1.2 + } }, { - "id": "sonar-deep-research", - "name": "Perplexity Sonar Deep Research", - "display_name": "Perplexity Sonar Deep Research", + "id": "NousResearch/DeepHermes-3-Mistral-24B-Preview", + "name": "DeepHermes 3 Mistral 24B Preview", + "display_name": "DeepHermes 3 Mistral 24B Preview", "modalities": { "input": [ "text" @@ -32739,30 +31582,27 @@ ] }, "limit": { - "context": 127000, - "output": 4096 + "context": 32768, + "output": 32768 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-01-27", - "last_updated": "2025-01-27", + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", "cost": { - "input": 2, - "output": 8 - }, - "type": "chat" + "input": 0.02, + "output": 0.1 + } }, { - "id": "gemini-2.5-flash-lite", - "name": "Google Gemini 2.5 Flash Lite", - "display_name": "Google Gemini 2.5 Flash Lite", + "id": "rednote-hilab/dots.ocr", + "name": "dots.ocr", + "display_name": "dots.ocr", "modalities": { "input": [ "text", @@ -32773,44 +31613,40 @@ ] }, "limit": { - "context": 1048576, - "output": 65535 + "context": 131072, + "output": 131072 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-07-22", - "last_updated": "2025-07-22", + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", "cost": { - "input": 0.09999999999999999, - "output": 0.39999999999999997, - "cache_read": 0.024999999999999998, - "cache_write": 0.09999999999999999 - }, - "type": "chat" + "input": 0.01, + "output": 0.01 + } }, { - "id": "claude-sonnet-4-5-20250929", - "name": "Anthropic: Claude Sonnet 4.5 (20250929)", - "display_name": "Anthropic: Claude Sonnet 4.5 (20250929)", + "id": "moonshotai/Kimi-K2.5-TEE", + "name": "Kimi K2.5 TEE", + "display_name": "Kimi K2.5 TEE", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 262144, + "output": 65535 }, "temperature": true, "tool_call": true, @@ -32819,22 +31655,19 @@ "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2025-09", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2026-01-27", + "last_updated": "2026-01-27", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.30000000000000004, - "cache_write": 3.75 - }, - "type": "chat" + "input": 0.6, + "output": 3 + } }, { - "id": "grok-3", - "name": "xAI Grok 3", - "display_name": "xAI Grok 3", + "id": "moonshotai/Kimi-K2-Instruct-0905", + "name": "Kimi K2 Instruct 0905", + "display_name": "Kimi K2 Instruct 0905", "modalities": { "input": [ "text" @@ -32844,8 +31677,8 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -32853,54 +31686,49 @@ "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-06", - "release_date": "2024-06-01", - "last_updated": "2024-06-01", + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.75 - }, - "type": "chat" + "input": 0.39, + "output": 1.9 + } }, { - "id": "mistral-small", - "name": "Mistral Small", - "display_name": "Mistral Small", + "id": "moonshotai/Kimi-K2-Thinking-TEE", + "name": "Kimi K2 Thinking TEE", + "display_name": "Kimi K2 Thinking TEE", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 262144, + "output": 65535 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2024-02", - "release_date": "2024-02-26", - "last_updated": "2024-02-26", + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", "cost": { - "input": 75, - "output": 200 - }, - "type": "chat" + "input": 0.4, + "output": 1.75 + } }, { - "id": "kimi-k2-0711", - "name": "Kimi K2 (07/11)", - "display_name": "Kimi K2 (07/11)", + "id": "MiniMaxAI/MiniMax-M2.1-TEE", + "name": "MiniMax M2.1 TEE", + "display_name": "MiniMax M2.1 TEE", "modalities": { "input": [ "text" @@ -32910,41 +31738,39 @@ ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 196608, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-27", "cost": { - "input": 0.5700000000000001, - "output": 2.3 - }, - "type": "chat" + "input": 0.27, + "output": 1.12 + } }, { - "id": "chatgpt-4o-latest", - "name": "OpenAI ChatGPT-4o", - "display_name": "OpenAI ChatGPT-4o", + "id": "nvidia/NVIDIA-Nemotron-3-Nano-30B-A3B-BF16", + "name": "NVIDIA Nemotron 3 Nano 30B A3B BF16", + "display_name": "NVIDIA Nemotron 3 Nano 30B A3B BF16", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -32952,21 +31778,18 @@ "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-08", - "release_date": "2024-08-14", - "last_updated": "2024-08-14", + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", "cost": { - "input": 5, - "output": 20, - "cache_read": 2.5 - }, - "type": "chat" + "input": 0.06, + "output": 0.24 + } }, { - "id": "qwen3-coder-30b-a3b-instruct", - "name": "Qwen3 Coder 30B A3B Instruct", - "display_name": "Qwen3 Coder 30B A3B Instruct", + "id": "tngtech/TNG-R1T-Chimera-Turbo", + "name": "TNG R1T Chimera Turbo", + "display_name": "TNG R1T Chimera Turbo", "modalities": { "input": [ "text" @@ -32976,31 +31799,30 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 163840, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-07-31", - "last_updated": "2025-07-31", + "open_weights": true, + "release_date": "2026-01-27", + "last_updated": "2026-01-27", "cost": { - "input": 0.09999999999999999, - "output": 0.3 - }, - "type": "chat" + "input": 0.22, + "output": 0.6 + } }, { - "id": "kimi-k2-0905", - "name": "Kimi K2 (09/05)", - "display_name": "Kimi K2 (09/05)", - "modalities": { - "input": [ + "id": "tngtech/DeepSeek-R1T-Chimera", + "name": "DeepSeek R1T Chimera", + "display_name": "DeepSeek R1T Chimera", + "modalities": { + "input": [ "text" ], "output": [ @@ -33008,30 +31830,28 @@ ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 163840, + "output": 163840 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2025-09", - "release_date": "2025-09-05", - "last_updated": "2025-09-05", + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", "cost": { - "input": 0.5, - "output": 2, - "cache_read": 0.39999999999999997 - }, - "type": "chat" + "input": 0.3, + "output": 1.2 + } }, { - "id": "sonar-reasoning", - "name": "Perplexity Sonar Reasoning", - "display_name": "Perplexity Sonar Reasoning", + "id": "tngtech/DeepSeek-TNG-R1T2-Chimera", + "name": "DeepSeek TNG R1T2 Chimera", + "display_name": "DeepSeek TNG R1T2 Chimera", "modalities": { "input": [ "text" @@ -33041,30 +31861,28 @@ ] }, "limit": { - "context": 127000, - "output": 4096 + "context": 163840, + "output": 163840 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-01-27", - "last_updated": "2025-01-27", + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", "cost": { - "input": 1, - "output": 5 - }, - "type": "chat" + "input": 0.25, + "output": 0.85 + } }, { - "id": "llama-3.3-70b-instruct", - "name": "Meta Llama 3.3 70B Instruct", - "display_name": "Meta Llama 3.3 70B Instruct", + "id": "tngtech/TNG-R1T-Chimera-TEE", + "name": "TNG R1T Chimera TEE", + "display_name": "TNG R1T Chimera TEE", "modalities": { "input": [ "text" @@ -33074,96 +31892,89 @@ ] }, "limit": { - "context": 128000, - "output": 16400 + "context": 163840, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2024-12", - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", "cost": { - "input": 0.13, - "output": 0.39 - }, - "type": "chat" + "input": 0.25, + "output": 0.85 + } }, { - "id": "gpt-5.1-codex-mini", - "name": "OpenAI: GPT-5.1 Codex Mini", - "display_name": "OpenAI: GPT-5.1 Codex Mini", + "id": "XiaomiMiMo/MiMo-V2-Flash", + "name": "MiMo V2 Flash", + "display_name": "MiMo V2 Flash", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "text", - "image" + "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 32768, + "output": 8192 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-27", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.024999999999999998 - }, - "type": "chat" + "input": 0.09, + "output": 0.29 + } }, { - "id": "kimi-k2-thinking", - "name": "Kimi K2 Thinking", - "display_name": "Kimi K2 Thinking", + "id": "OpenGVLab/InternVL3-78B-TEE", + "name": "InternVL3 78B TEE", + "display_name": "InternVL3 78B TEE", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 262144 + "context": 32768, + "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2025-11", - "release_date": "2025-11-06", - "last_updated": "2025-11-06", + "open_weights": true, + "release_date": "2025-01-06", + "last_updated": "2026-01-10", "cost": { - "input": 0.48, - "output": 2 - }, - "type": "chat" + "input": 0.1, + "output": 0.39 + } }, { - "id": "o3-mini", - "name": "OpenAI o3 Mini", - "display_name": "OpenAI o3 Mini", + "id": "openai/gpt-oss-120b-TEE", + "name": "gpt oss 120b TEE", + "display_name": "gpt oss 120b TEE", "modalities": { "input": [ "text" @@ -33173,42 +31984,39 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 131072, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2023-10", - "release_date": "2023-10-01", - "last_updated": "2023-10-01", + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.55 - }, - "type": "chat" + "input": 0.04, + "output": 0.18 + } }, { - "id": "claude-4.5-sonnet", - "name": "Anthropic: Claude Sonnet 4.5", - "display_name": "Anthropic: Claude Sonnet 4.5", + "id": "openai/gpt-oss-20b", + "name": "gpt oss 20b", + "display_name": "gpt oss 20b", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -33217,57 +32025,49 @@ "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2025-09", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.30000000000000004, - "cache_write": 3.75 - }, - "type": "chat" + "input": 0.02, + "output": 0.1 + } }, { - "id": "gpt-5.1", - "name": "OpenAI GPT-5.1", - "display_name": "OpenAI GPT-5.1", + "id": "chutesai/Mistral-Small-3.1-24B-Instruct-2503", + "name": "Mistral Small 3.1 24B Instruct 2503", + "display_name": "Mistral Small 3.1 24B Instruct 2503", "modalities": { "input": [ "text", "image" ], "output": [ - "text", - "image" + "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 131072, + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.12500000000000003 - }, - "type": "chat" + "input": 0.03, + "output": 0.11 + } }, { - "id": "codex-mini-latest", - "name": "OpenAI Codex Mini Latest", - "display_name": "OpenAI Codex Mini Latest", + "id": "chutesai/Mistral-Small-3.2-24B-Instruct-2506", + "name": "Mistral Small 3.2 24B Instruct 2506", + "display_name": "Mistral Small 3.2 24B Instruct 2506", "modalities": { "input": [ "text", @@ -33278,64 +32078,57 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 131072, + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", "cost": { - "input": 1.5, - "output": 6, - "cache_read": 0.375 - }, - "type": "chat" + "input": 0.06, + "output": 0.18 + } }, { - "id": "gpt-5-nano", - "name": "OpenAI GPT-5 Nano", - "display_name": "OpenAI GPT-5 Nano", + "id": "mistralai/Devstral-2-123B-Instruct-2512-TEE", + "name": "Devstral 2 123B Instruct 2512 TEE", + "display_name": "Devstral 2 123B Instruct 2512 TEE", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 262144, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "open_weights": true, + "release_date": "2026-01-10", + "last_updated": "2026-01-10", "cost": { - "input": 0.049999999999999996, - "output": 0.39999999999999997, - "cache_read": 0.005 - }, - "type": "chat" + "input": 0.05, + "output": 0.22 + } }, { - "id": "gpt-5-codex", - "name": "OpenAI: GPT-5 Codex", - "display_name": "OpenAI: GPT-5 Codex", + "id": "unsloth/Mistral-Nemo-Instruct-2407", + "name": "Mistral Nemo Instruct 2407", + "display_name": "Mistral Nemo Instruct 2407", "modalities": { "input": [ "text" @@ -33345,30 +32138,58 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 131072, + "output": 131072 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.12500000000000003 + "input": 0.02, + "output": 0.04 + } + }, + { + "id": "unsloth/gemma-3-4b-it", + "name": "gemma 3 4b it", + "display_name": "gemma 3 4b it", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] }, - "type": "chat" + "limit": { + "context": 96000, + "output": 96000 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", + "cost": { + "input": 0.01, + "output": 0.03 + } }, { - "id": "gpt-4o", - "name": "OpenAI GPT-4o", - "display_name": "OpenAI GPT-4o", + "id": "unsloth/Mistral-Small-24B-Instruct-2501", + "name": "Mistral Small 24B Instruct 2501", + "display_name": "Mistral Small 24B Instruct 2501", "modalities": { "input": [ "text", @@ -33379,8 +32200,8 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 32768, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -33388,21 +32209,18 @@ "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-05", - "release_date": "2024-05-13", - "last_updated": "2024-05-13", + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", "cost": { - "input": 2.5, - "output": 10, - "cache_read": 1.25 - }, - "type": "chat" + "input": 0.03, + "output": 0.11 + } }, { - "id": "deepseek-tng-r1t2-chimera", - "name": "DeepSeek TNG R1T2 Chimera", - "display_name": "DeepSeek TNG R1T2 Chimera", + "id": "unsloth/Llama-3.2-1B-Instruct", + "name": "Llama 3.2 1B Instruct", + "display_name": "Llama 3.2 1B Instruct", "modalities": { "input": [ "text" @@ -33412,29 +32230,27 @@ ] }, "limit": { - "context": 130000, - "output": 163840 + "context": 32768, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-07-02", - "last_updated": "2025-07-02", + "open_weights": true, + "release_date": "2026-01-27", + "last_updated": "2026-01-27", "cost": { - "input": 0.3, - "output": 1.2 - }, - "type": "chat" + "input": 0.01, + "output": 0.01 + } }, { - "id": "claude-4.5-opus", - "name": "Anthropic: Claude Opus 4.5", - "display_name": "Anthropic: Claude Opus 4.5", + "id": "unsloth/gemma-3-12b-it", + "name": "gemma 3 12b it", + "display_name": "gemma 3 12b it", "modalities": { "input": [ "text", @@ -33445,32 +32261,27 @@ ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 131072, + "output": 131072 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2025-11", - "release_date": "2025-11-24", - "last_updated": "2025-11-24", + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5000000000000001, - "cache_write": 6.25 - }, - "type": "chat" + "input": 0.03, + "output": 0.1 + } }, { - "id": "gpt-4.1", - "name": "OpenAI GPT-4.1", - "display_name": "OpenAI GPT-4.1", + "id": "unsloth/gemma-3-27b-it", + "name": "gemma 3 27b it", + "display_name": "gemma 3 27b it", "modalities": { "input": [ "text", @@ -33481,8 +32292,8 @@ ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 96000, + "output": 96000 }, "temperature": true, "tool_call": true, @@ -33490,21 +32301,18 @@ "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", "cost": { - "input": 2, - "output": 8, - "cache_read": 0.5 - }, - "type": "chat" + "input": 0.04, + "output": 0.15 + } }, { - "id": "sonar", - "name": "Perplexity Sonar", - "display_name": "Perplexity Sonar", + "id": "Qwen/Qwen3-30B-A3B", + "name": "Qwen3 30B A3B", + "display_name": "Qwen3 30B A3B", "modalities": { "input": [ "text" @@ -33514,29 +32322,28 @@ ] }, "limit": { - "context": 127000, - "output": 4096 + "context": 40960, + "output": 40960 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-01-27", - "last_updated": "2025-01-27", + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", "cost": { - "input": 1, - "output": 1 - }, - "type": "chat" + "input": 0.06, + "output": 0.22 + } }, { - "id": "glm-4.6", - "name": "Zai GLM-4.6", - "display_name": "Zai GLM-4.6", + "id": "Qwen/Qwen3-14B", + "name": "Qwen3 14B", + "display_name": "Qwen3 14B", "modalities": { "input": [ "text" @@ -33546,8 +32353,8 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 40960, + "output": 40960 }, "temperature": true, "tool_call": true, @@ -33556,20 +32363,18 @@ "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2024-07", - "release_date": "2024-07-18", - "last_updated": "2024-07-18", + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", "cost": { - "input": 0.44999999999999996, - "output": 1.5 - }, - "type": "chat" + "input": 0.05, + "output": 0.22 + } }, { - "id": "o4-mini", - "name": "OpenAI o4 Mini", - "display_name": "OpenAI o4 Mini", + "id": "Qwen/Qwen2.5-VL-32B-Instruct", + "name": "Qwen2.5 VL 32B Instruct", + "display_name": "Qwen2.5 VL 32B Instruct", "modalities": { "input": [ "text", @@ -33580,65 +32385,57 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 16384, + "output": 16384 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-06", - "release_date": "2024-06-01", - "last_updated": "2024-06-01", + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.275 - }, - "type": "chat" + "input": 0.05, + "output": 0.22 + } }, { - "id": "qwen3-235b-a22b-thinking", - "name": "Qwen3 235B A22B Thinking", - "display_name": "Qwen3 235B A22B Thinking", + "id": "Qwen/Qwen3Guard-Gen-0.6B", + "name": "Qwen3Guard Gen 0.6B", + "display_name": "Qwen3Guard Gen 0.6B", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 81920 + "context": 32768, + "output": 8192 }, "temperature": true, "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-07-25", - "last_updated": "2025-07-25", + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", "cost": { - "input": 0.3, - "output": 2.9000000000000004 - }, - "type": "chat" + "input": 0.01, + "output": 0.01 + } }, { - "id": "hermes-2-pro-llama-3-8b", - "name": "Hermes 2 Pro Llama 3 8B", - "display_name": "Hermes 2 Pro Llama 3 8B", + "id": "Qwen/Qwen2.5-Coder-32B-Instruct", + "name": "Qwen2.5 Coder 32B Instruct", + "display_name": "Qwen2.5 Coder 32B Instruct", "modalities": { "input": [ "text" @@ -33648,29 +32445,27 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 32768, + "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-05", - "release_date": "2024-05-27", - "last_updated": "2024-05-27", + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", "cost": { - "input": 0.14, - "output": 0.14 - }, - "type": "chat" + "input": 0.03, + "output": 0.11 + } }, { - "id": "o1", - "name": "OpenAI: o1", - "display_name": "OpenAI: o1", + "id": "Qwen/Qwen2.5-72B-Instruct", + "name": "Qwen2.5 72B Instruct", + "display_name": "Qwen2.5 72B Instruct", "modalities": { "input": [ "text" @@ -33680,63 +32475,58 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 32768, + "output": 32768 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", "cost": { - "input": 15, - "output": 60, - "cache_read": 7.5 - }, - "type": "chat" + "input": 0.13, + "output": 0.52 + } }, { - "id": "grok-3-mini", - "name": "xAI Grok 3 Mini", - "display_name": "xAI Grok 3 Mini", + "id": "Qwen/Qwen2.5-VL-72B-Instruct-TEE", + "name": "Qwen2.5 VL 72B Instruct TEE", + "display_name": "Qwen2.5 VL 72B Instruct TEE", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 32768, + "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-06", - "release_date": "2024-06-01", - "last_updated": "2024-06-01", + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", "cost": { - "input": 0.3, - "output": 0.5, - "cache_read": 0.075 - }, - "type": "chat" + "input": 0.15, + "output": 0.6 + } }, { - "id": "sonar-pro", - "name": "Perplexity Sonar Pro", - "display_name": "Perplexity Sonar Pro", + "id": "Qwen/Qwen3-235B-A22B", + "name": "Qwen3 235B A22B", + "display_name": "Qwen3 235B A22B", "modalities": { "input": [ "text" @@ -33746,63 +32536,58 @@ ] }, "limit": { - "context": 200000, - "output": 4096 + "context": 40960, + "output": 40960 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-01-27", - "last_updated": "2025-01-27", + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", "cost": { - "input": 3, - "output": 15 - }, - "type": "chat" + "input": 0.3, + "output": 1.2 + } }, { - "id": "gpt-5-mini", - "name": "OpenAI GPT-5 Mini", - "display_name": "OpenAI GPT-5 Mini", + "id": "Qwen/Qwen3-235B-A22B-Instruct-2507-TEE", + "name": "Qwen3 235B A22B Instruct 2507 TEE", + "display_name": "Qwen3 235B A22B Instruct 2507 TEE", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 262144, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.024999999999999998 - }, - "type": "chat" + "input": 0.08, + "output": 0.55 + } }, { - "id": "deepseek-r1-distill-llama-70b", - "name": "DeepSeek R1 Distill Llama 70B", - "display_name": "DeepSeek R1 Distill Llama 70B", + "id": "Qwen/Qwen3-32B", + "name": "Qwen3 32B", + "display_name": "Qwen3 32B", "modalities": { "input": [ "text" @@ -33812,8 +32597,8 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 40960, + "output": 40960 }, "temperature": true, "tool_call": true, @@ -33822,20 +32607,49 @@ "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-01-20", - "last_updated": "2025-01-20", + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", "cost": { - "input": 0.03, - "output": 0.13 + "input": 0.08, + "output": 0.24 + } + }, + { + "id": "Qwen/Qwen3-VL-235B-A22B-Instruct", + "name": "Qwen3 VL 235B A22B Instruct", + "display_name": "Qwen3 VL 235B A22B Instruct", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] }, - "type": "chat" + "limit": { + "context": 262144, + "output": 262144 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", + "cost": { + "input": 0.3, + "output": 1.2 + } }, { - "id": "o1-mini", - "name": "OpenAI: o1-mini", - "display_name": "OpenAI: o1-mini", + "id": "Qwen/Qwen3-Coder-Next", + "name": "Qwen3 Coder Next", + "display_name": "Qwen3 Coder Next", "modalities": { "input": [ "text" @@ -33845,42 +32659,38 @@ ] }, "limit": { - "context": 128000, + "context": 262144, "output": 65536 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "open_weights": true, + "release_date": "2026-02-05", + "last_updated": "2026-02-05", "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.55 - }, - "type": "chat" + "input": 0.07, + "output": 0.3 + } }, { - "id": "claude-3.7-sonnet", - "name": "Anthropic: Claude 3.7 Sonnet", - "display_name": "Anthropic: Claude 3.7 Sonnet", + "id": "Qwen/Qwen3-30B-A3B-Instruct-2507", + "name": "Qwen3 30B A3B Instruct 2507", + "display_name": "Qwen3 30B A3B Instruct 2507", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -33888,34 +32698,29 @@ "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2025-02", - "release_date": "2025-02-19", - "last_updated": "2025-02-19", + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.30000000000000004, - "cache_write": 3.75 - }, - "type": "chat" + "input": 0.08, + "output": 0.33 + } }, { - "id": "claude-3-haiku-20240307", - "name": "Anthropic: Claude 3 Haiku", - "display_name": "Anthropic: Claude 3 Haiku", + "id": "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8-TEE", + "name": "Qwen3 Coder 480B A35B Instruct FP8 TEE", + "display_name": "Qwen3 Coder 480B A35B Instruct FP8 TEE", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 4096 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -33923,55 +32728,49 @@ "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-03", - "release_date": "2024-03-07", - "last_updated": "2024-03-07", + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", "cost": { - "input": 0.25, - "output": 1.25, - "cache_read": 0.03, - "cache_write": 0.3 - }, - "type": "chat" + "input": 0.22, + "output": 0.95 + } }, { - "id": "o3-pro", - "name": "OpenAI o3 Pro", - "display_name": "OpenAI o3 Pro", + "id": "Qwen/Qwen3-235B-A22B-Thinking-2507", + "name": "Qwen3 235B A22B Thinking 2507", + "display_name": "Qwen3 235B A22B Thinking 2507", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 262144, + "output": 262144 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2024-06", - "release_date": "2024-06-01", - "last_updated": "2024-06-01", + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", "cost": { - "input": 20, - "output": 80 - }, - "type": "chat" + "input": 0.11, + "output": 0.6 + } }, { - "id": "qwen2.5-coder-7b-fast", - "name": "Qwen2.5 Coder 7B fast", - "display_name": "Qwen2.5 Coder 7B fast", + "id": "Qwen/Qwen3-Next-80B-A3B-Instruct", + "name": "Qwen3 Next 80B A3B Instruct", + "display_name": "Qwen3 Next 80B A3B Instruct", "modalities": { "input": [ "text" @@ -33981,29 +32780,27 @@ ] }, "limit": { - "context": 32000, - "output": 8192 + "context": 262144, + "output": 262144 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-09", - "release_date": "2024-09-15", - "last_updated": "2024-09-15", + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", "cost": { - "input": 0.03, - "output": 0.09 - }, - "type": "chat" + "input": 0.1, + "output": 0.8 + } }, { - "id": "deepseek-reasoner", - "name": "DeepSeek Reasoner", - "display_name": "DeepSeek Reasoner", + "id": "miromind-ai/MiroThinker-v1.5-235B", + "name": "MiroThinker V1.5 235B", + "display_name": "MiroThinker V1.5 235B", "modalities": { "input": [ "text" @@ -34013,8 +32810,8 @@ ] }, "limit": { - "context": 128000, - "output": 64000 + "context": 32768, + "output": 8192 }, "temperature": true, "tool_call": false, @@ -34022,32 +32819,28 @@ "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-01-20", - "last_updated": "2025-01-20", + "open_weights": true, + "release_date": "2026-01-10", + "last_updated": "2026-01-10", "cost": { - "input": 0.56, - "output": 1.68, - "cache_read": 0.07 - }, - "type": "chat" + "input": 0.3, + "output": 1.2 + } }, { - "id": "gemini-2.5-pro", - "name": "Google Gemini 2.5 Pro", - "display_name": "Google Gemini 2.5 Pro", + "id": "zai-org/GLM-4.6-TEE", + "name": "GLM 4.6 TEE", + "display_name": "GLM 4.6 TEE", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, + "context": 202752, "output": 65536 }, "temperature": true, @@ -34057,26 +32850,21 @@ "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2025-06", - "release_date": "2025-06-17", - "last_updated": "2025-06-17", + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.3125, - "cache_write": 1.25 - }, - "type": "chat" + "input": 0.35, + "output": 1.5 + } }, { - "id": "gemma-3-12b-it", - "name": "Google Gemma 3 12B", - "display_name": "Google Gemma 3 12B", + "id": "zai-org/GLM-4.5-TEE", + "name": "GLM 4.5 TEE", + "display_name": "GLM 4.5 TEE", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -34084,28 +32872,27 @@ }, "limit": { "context": 131072, - "output": 8192 + "output": 65536 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2024-12", - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", "cost": { - "input": 0.049999999999999996, - "output": 0.09999999999999999 - }, - "type": "chat" + "input": 0.35, + "output": 1.55 + } }, { - "id": "mistral-nemo", - "name": "Mistral Nemo", - "display_name": "Mistral Nemo", + "id": "zai-org/GLM-4.6V", + "name": "GLM 4.6V", + "display_name": "GLM 4.6V", "modalities": { "input": [ "text", @@ -34116,63 +32903,59 @@ ] }, "limit": { - "context": 128000, - "output": 16400 + "context": 131072, + "output": 65536 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2024-07", - "release_date": "2024-07-18", - "last_updated": "2024-07-18", + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", "cost": { - "input": 20, - "output": 40 - }, - "type": "chat" + "input": 0.3, + "output": 0.9 + } }, { - "id": "o3", - "name": "OpenAI o3", - "display_name": "OpenAI o3", + "id": "zai-org/GLM-4.7-FP8", + "name": "GLM 4.7 FP8", + "display_name": "GLM 4.7 FP8", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 202752, + "output": 65535 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2024-06", - "release_date": "2024-06-01", - "last_updated": "2024-06-01", + "open_weights": true, + "release_date": "2026-01-27", + "last_updated": "2026-01-27", "cost": { - "input": 2, - "output": 8, - "cache_read": 0.5 - }, - "type": "chat" + "input": 0.3, + "output": 1.2 + } }, { - "id": "gpt-oss-20b", - "name": "OpenAI GPT-OSS 20b", - "display_name": "OpenAI GPT-OSS 20b", + "id": "zai-org/GLM-4.6-FP8", + "name": "GLM 4.6 FP8", + "display_name": "GLM 4.6 FP8", "modalities": { "input": [ "text" @@ -34182,8 +32965,8 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 202752, + "output": 65535 }, "temperature": true, "tool_call": true, @@ -34192,20 +32975,18 @@ "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2024-06", - "release_date": "2024-06-01", - "last_updated": "2024-06-01", + "open_weights": true, + "release_date": "2026-01-27", + "last_updated": "2026-01-27", "cost": { - "input": 0.049999999999999996, - "output": 0.19999999999999998 - }, - "type": "chat" + "input": 0.3, + "output": 1.2 + } }, { - "id": "gpt-oss-120b", - "name": "OpenAI GPT-OSS 120b", - "display_name": "OpenAI GPT-OSS 120b", + "id": "zai-org/GLM-4.7-TEE", + "name": "GLM 4.7 TEE", + "display_name": "GLM 4.7 TEE", "modalities": { "input": [ "text" @@ -34215,8 +32996,8 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 202752, + "output": 65535 }, "temperature": true, "tool_call": true, @@ -34225,123 +33006,111 @@ "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2024-06", - "release_date": "2024-06-01", - "last_updated": "2024-06-01", + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", "cost": { - "input": 0.04, - "output": 0.16 - }, - "type": "chat" + "input": 0.4, + "output": 1.5 + } }, { - "id": "claude-3.5-haiku", - "name": "Anthropic: Claude 3.5 Haiku", - "display_name": "Anthropic: Claude 3.5 Haiku", + "id": "zai-org/GLM-4.5-FP8", + "name": "GLM 4.5 FP8", + "display_name": "GLM 4.5 FP8", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 8192 + "context": 131072, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-10-22", - "last_updated": "2024-10-22", + "open_weights": true, + "release_date": "2026-01-27", + "last_updated": "2026-01-27", "cost": { - "input": 0.7999999999999999, - "output": 4, - "cache_read": 0.08, - "cache_write": 1 - }, - "type": "chat" + "input": 0.3, + "output": 1.2 + } }, { - "id": "gpt-5-chat-latest", - "name": "OpenAI GPT-5 Chat Latest", - "display_name": "OpenAI GPT-5 Chat Latest", + "id": "zai-org/GLM-4.7-Flash", + "name": "GLM 4.7 Flash", + "display_name": "GLM 4.7 Flash", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 202752, + "output": 65535 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2024-09", - "release_date": "2024-09-30", - "last_updated": "2024-09-30", + "open_weights": true, + "release_date": "2026-01-27", + "last_updated": "2026-01-27", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.12500000000000003 - }, - "type": "chat" + "input": 0.06, + "output": 0.35 + } }, { - "id": "gpt-4o-mini", - "name": "OpenAI GPT-4o-mini", - "display_name": "OpenAI GPT-4o-mini", + "id": "zai-org/GLM-4.5-Air", + "name": "GLM 4.5 Air", + "display_name": "GLM 4.5 Air", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2024-07", - "release_date": "2024-07-18", - "last_updated": "2024-07-18", + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", "cost": { - "input": 0.15, - "output": 0.6, - "cache_read": 0.075 - }, - "type": "chat" + "input": 0.05, + "output": 0.22 + } }, { - "id": "gemma2-9b-it", - "name": "Google Gemma 2", - "display_name": "Google Gemma 2", + "id": "deepseek-ai/DeepSeek-V3-0324-TEE", + "name": "DeepSeek V3 0324 TEE", + "display_name": "DeepSeek V3 0324 TEE", "modalities": { "input": [ "text" @@ -34351,65 +33120,58 @@ ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 163840, + "output": 65536 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-06", - "release_date": "2024-06-25", - "last_updated": "2024-06-25", + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", "cost": { - "input": 0.01, - "output": 0.03 - }, - "type": "chat" + "input": 0.19, + "output": 0.87 + } }, { - "id": "claude-sonnet-4", - "name": "Anthropic: Claude Sonnet 4", - "display_name": "Anthropic: Claude Sonnet 4", + "id": "deepseek-ai/DeepSeek-V3.2-Speciale-TEE", + "name": "DeepSeek V3.2 Speciale TEE", + "display_name": "DeepSeek V3.2 Speciale TEE", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 163840, + "output": 65536 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2025-05", - "release_date": "2025-05-14", - "last_updated": "2025-05-14", + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.30000000000000004, - "cache_write": 3.75 - }, - "type": "chat" + "input": 0.27, + "output": 0.41 + } }, { - "id": "sonar-reasoning-pro", - "name": "Perplexity Sonar Reasoning Pro", - "display_name": "Perplexity Sonar Reasoning Pro", + "id": "deepseek-ai/DeepSeek-V3.1-Terminus-TEE", + "name": "DeepSeek V3.1 Terminus TEE", + "display_name": "DeepSeek V3.1 Terminus TEE", "modalities": { "input": [ "text" @@ -34419,131 +33181,120 @@ ] }, "limit": { - "context": 127000, - "output": 4096 + "context": 163840, + "output": 65536 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-01-27", - "last_updated": "2025-01-27", + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", "cost": { - "input": 2, - "output": 8 - }, - "type": "chat" + "input": 0.23, + "output": 0.9 + } }, { - "id": "gpt-5", - "name": "OpenAI GPT-5", - "display_name": "OpenAI GPT-5", + "id": "deepseek-ai/DeepSeek-V3", + "name": "DeepSeek V3", + "display_name": "DeepSeek V3", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 163840, + "output": 163840 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.12500000000000003 - }, - "type": "chat" + "input": 0.3, + "output": 1.2 + } }, { - "id": "qwen3-vl-235b-a22b-instruct", - "name": "Qwen3 VL 235B A22B Instruct", - "display_name": "Qwen3 VL 235B A22B Instruct", + "id": "deepseek-ai/DeepSeek-R1-TEE", + "name": "DeepSeek R1 TEE", + "display_name": "DeepSeek R1 TEE", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 16384 + "context": 163840, + "output": 163840 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2025-09", - "release_date": "2025-09-23", - "last_updated": "2025-09-23", + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", "cost": { "input": 0.3, - "output": 1.5 - }, - "type": "chat" + "output": 1.2 + } }, { - "id": "qwen3-30b-a3b", - "name": "Qwen3 30B A3B", - "display_name": "Qwen3 30B A3B", + "id": "deepseek-ai/DeepSeek-R1-Distill-Llama-70B", + "name": "DeepSeek R1 Distill Llama 70B", + "display_name": "DeepSeek R1 Distill Llama 70B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 41000, - "output": 41000 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2025-06", - "release_date": "2025-06-01", - "last_updated": "2025-06-01", + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", "cost": { - "input": 0.08, - "output": 0.29 - }, - "type": "chat" + "input": 0.03, + "output": 0.11 + } }, { - "id": "deepseek-v3.2", - "name": "DeepSeek V3.2", - "display_name": "DeepSeek V3.2", + "id": "deepseek-ai/DeepSeek-R1-0528-TEE", + "name": "DeepSeek R1 0528 TEE", + "display_name": "DeepSeek R1 0528 TEE", "modalities": { "input": [ "text" @@ -34559,58 +33310,53 @@ "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2025-09", - "release_date": "2025-09-22", - "last_updated": "2025-09-22", + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", "cost": { - "input": 0.27, - "output": 0.41 - }, - "type": "chat" + "input": 0.4, + "output": 1.75 + } }, { - "id": "grok-4-1-fast-non-reasoning", - "name": "xAI Grok 4.1 Fast Non-Reasoning", - "display_name": "xAI Grok 4.1 Fast Non-Reasoning", + "id": "deepseek-ai/DeepSeek-V3.2-TEE", + "name": "DeepSeek V3.2 TEE", + "display_name": "DeepSeek V3.2 TEE", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "text", - "image" + "text" ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 163840, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2025-11", - "release_date": "2025-11-17", - "last_updated": "2025-11-17", + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", "cost": { - "input": 0.19999999999999998, - "output": 0.5, - "cache_read": 0.049999999999999996 - }, - "type": "chat" + "input": 0.25, + "output": 0.38 + } }, { - "id": "gpt-5-pro", - "name": "OpenAI: GPT-5 Pro", - "display_name": "OpenAI: GPT-5 Pro", + "id": "deepseek-ai/DeepSeek-V3.1-TEE", + "name": "DeepSeek V3.1 TEE", + "display_name": "DeepSeek V3.1 TEE", "modalities": { "input": [ "text" @@ -34620,61 +33366,73 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 163840, + "output": 65536 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", "cost": { - "input": 15, - "output": 120 - }, - "type": "chat" - }, + "input": 0.2, + "output": 0.8 + } + } + ] + }, + "kimi-for-coding": { + "id": "kimi-for-coding", + "name": "Kimi For Coding", + "display_name": "Kimi For Coding", + "api": "https://api.kimi.com/coding/v1", + "doc": "https://www.kimi.com/coding/docs/en/third-party-agents.html", + "models": [ { - "id": "llama-3.3-70b-versatile", - "name": "Meta Llama 3.3 70B Versatile", - "display_name": "Meta Llama 3.3 70B Versatile", + "id": "k2p5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32678 + "context": 262144, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2024-12", - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-01", + "last_updated": "2026-01", "cost": { - "input": 0.59, - "output": 0.7899999999999999 - }, - "type": "chat" + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 + } }, { - "id": "mistral-large-2411", - "name": "Mistral-Large", - "display_name": "Mistral-Large", + "id": "kimi-k2-thinking", + "name": "Kimi K2 Thinking", + "display_name": "Kimi K2 Thinking", "modalities": { "input": [ "text" @@ -34684,29 +33442,40 @@ ] }, "limit": { - "context": 128000, + "context": 262144, "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2024-07", - "release_date": "2024-07-24", - "last_updated": "2024-07-24", + "open_weights": true, + "knowledge": "2025-07", + "release_date": "2025-11", + "last_updated": "2025-12", "cost": { - "input": 2, - "output": 6 - }, - "type": "chat" - }, + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 + } + } + ] + }, + "cortecs": { + "id": "cortecs", + "name": "Cortecs", + "display_name": "Cortecs", + "api": "https://api.cortecs.ai/v1", + "doc": "https://api.cortecs.ai/v1/models", + "models": [ { - "id": "claude-opus-4-1-20250805", - "name": "Anthropic: Claude Opus 4.1 (20250805)", - "display_name": "Anthropic: Claude Opus 4.1 (20250805)", + "id": "nova-pro-v1", + "name": "Nova Pro 1.0", + "display_name": "Nova Pro 1.0", "modalities": { "input": [ "text", @@ -34717,32 +33486,28 @@ ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 300000, + "output": 5000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2025-08", - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "knowledge": "2024-04", + "release_date": "2024-12-03", + "last_updated": "2024-12-03", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 - }, - "type": "chat" + "input": 1.016, + "output": 4.061 + } }, { - "id": "ernie-4.5-21b-a3b-thinking", - "name": "Baidu Ernie 4.5 21B A3B Thinking", - "display_name": "Baidu Ernie 4.5 21B A3B Thinking", + "id": "devstral-2512", + "name": "Devstral 2 2512", + "display_name": "Devstral 2 2512", "modalities": { "input": [ "text" @@ -34752,76 +33517,73 @@ ] }, "limit": { - "context": 128000, - "output": 8000 + "context": 262000, + "output": 262000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2025-03", - "release_date": "2025-03-16", - "last_updated": "2025-03-16", + "open_weights": true, + "knowledge": "2025-12", + "release_date": "2025-12-09", + "last_updated": "2025-12-09", "cost": { - "input": 0.07, - "output": 0.28 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "gpt-5.1-chat-latest", - "name": "OpenAI GPT-5.1 Chat", - "display_name": "OpenAI GPT-5.1 Chat", + "id": "intellect-3", + "name": "INTELLECT 3", + "display_name": "INTELLECT 3", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "text", - "image" + "text" ] }, "limit": { "context": 128000, - "output": 16384 + "output": 128000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "attachment": true, + "open_weights": true, + "knowledge": "2025-11", + "release_date": "2025-11-26", + "last_updated": "2025-11-26", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.12500000000000003 - }, - "type": "chat" + "input": 0.219, + "output": 1.202 + } }, { - "id": "qwen3-32b", - "name": "Qwen3 32B", - "display_name": "Qwen3 32B", + "id": "claude-4-5-sonnet", + "name": "Claude 4.5 Sonnet", + "display_name": "Claude 4.5 Sonnet", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 40960 + "context": 200000, + "output": 200000 }, "temperature": true, "tool_call": true, @@ -34829,33 +33591,31 @@ "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-04-28", - "last_updated": "2025-04-28", + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 0.29, - "output": 0.59 - }, - "type": "chat" + "input": 3.259, + "output": 16.296 + } }, { - "id": "claude-haiku-4-5-20251001", - "name": "Anthropic: Claude 4.5 Haiku (20251001)", - "display_name": "Anthropic: Claude 4.5 Haiku (20251001)", + "id": "deepseek-v3-0324", + "name": "DeepSeek V3 0324", + "display_name": "DeepSeek V3 0324", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 8192 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -34863,64 +33623,51 @@ "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2025-10", - "release_date": "2025-10-01", - "last_updated": "2025-10-01", + "open_weights": true, + "knowledge": "2024-07", + "release_date": "2025-03-24", + "last_updated": "2025-03-24", "cost": { - "input": 1, - "output": 5, - "cache_read": 0.09999999999999999, - "cache_write": 1.25 - }, - "type": "chat" + "input": 0.551, + "output": 1.654 + } }, { - "id": "llama-4-scout", - "name": "Meta Llama 4 Scout 17B 16E", - "display_name": "Meta Llama 4 Scout 17B 16E", + "id": "kimi-k2-thinking", + "name": "Kimi K2 Thinking", + "display_name": "Kimi K2 Thinking", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "attachment": true, + "open_weights": true, + "knowledge": "2025-12", + "release_date": "2025-12-08", + "last_updated": "2025-12-08", "cost": { - "input": 0.08, - "output": 0.3 - }, - "type": "chat" - } - ] - }, - "huggingface": { - "id": "huggingface", - "name": "Hugging Face", - "display_name": "Hugging Face", - "api": "https://router.huggingface.co/v1", - "doc": "https://huggingface.co/docs/inference-providers", - "models": [ + "input": 0.656, + "output": 2.731 + } + }, { - "id": "moonshotai/Kimi-K2-Instruct", - "name": "Kimi-K2-Instruct", - "display_name": "Kimi-K2-Instruct", + "id": "kimi-k2-instruct", + "name": "Kimi K2 Instruct", + "display_name": "Kimi K2 Instruct", "modalities": { "input": [ "text" @@ -34930,8 +33677,8 @@ ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 131000, + "output": 131000 }, "temperature": true, "tool_call": true, @@ -34940,30 +33687,30 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-07-14", - "last_updated": "2025-07-14", + "knowledge": "2024-07", + "release_date": "2025-07-11", + "last_updated": "2025-09-05", "cost": { - "input": 1, - "output": 3 - }, - "type": "chat" + "input": 0.551, + "output": 2.646 + } }, { - "id": "moonshotai/Kimi-K2-Instruct-0905", - "name": "Kimi-K2-Instruct-0905", - "display_name": "Kimi-K2-Instruct-0905", + "id": "gpt-4.1", + "name": "GPT 4.1", + "display_name": "GPT 4.1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 1047576, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -34971,54 +33718,51 @@ "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-09-04", - "last_updated": "2025-09-04", + "open_weights": false, + "knowledge": "2024-06", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 1, - "output": 3 - }, - "type": "chat" + "input": 2.354, + "output": 9.417 + } }, { - "id": "moonshotai/Kimi-K2-Thinking", - "name": "Kimi-K2-Thinking", - "display_name": "Kimi-K2-Thinking", + "id": "gemini-2.5-pro", + "name": "Gemini 2.5 Pro", + "display_name": "Gemini 2.5 Pro", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 1048576, + "output": 65535 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-11-06", - "last_updated": "2025-11-06", + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-06-17", "cost": { - "input": 0.6, - "output": 2.5, - "cache_read": 0.15 - }, - "type": "chat" + "input": 1.654, + "output": 11.024 + } }, { - "id": "MiniMaxAI/MiniMax-M2.1", - "name": "MiniMax-M2.1", - "display_name": "MiniMax-M2.1", + "id": "gpt-oss-120b", + "name": "GPT Oss 120b", + "display_name": "GPT Oss 120b", "modalities": { "input": [ "text" @@ -35028,63 +33772,60 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-10", - "release_date": "2025-12-23", - "last_updated": "2025-12-23", + "knowledge": "2024-01", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.3, - "output": 1.2 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "XiaomiMiMo/MiMo-V2-Flash", - "name": "MiMo-V2-Flash", - "display_name": "MiMo-V2-Flash", + "id": "devstral-small-2512", + "name": "Devstral Small 2 2512", + "display_name": "Devstral Small 2 2512", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 4096 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-12-16", - "last_updated": "2025-12-16", + "knowledge": "2025-12", + "release_date": "2025-12-09", + "last_updated": "2025-12-09", "cost": { - "input": 0.1, - "output": 0.3 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "Qwen/Qwen3-Embedding-8B", - "name": "Qwen 3 Embedding 8B", - "display_name": "Qwen 3 Embedding 8B", + "id": "qwen3-coder-480b-a35b-instruct", + "name": "Qwen3 Coder 480B A35B Instruct", + "display_name": "Qwen3 Coder 480B A35B Instruct", "modalities": { "input": [ "text" @@ -35094,61 +33835,61 @@ ] }, "limit": { - "context": 32000, - "output": 4096 + "context": 262000, + "output": 262000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "knowledge": "2025-01", + "release_date": "2025-07-25", + "last_updated": "2025-07-25", "cost": { - "input": 0.01, - "output": 0 - }, - "type": "embedding" + "input": 0.441, + "output": 1.984 + } }, { - "id": "Qwen/Qwen3-Embedding-4B", - "name": "Qwen 3 Embedding 4B", - "display_name": "Qwen 3 Embedding 4B", + "id": "claude-sonnet-4", + "name": "Claude Sonnet 4", + "display_name": "Claude Sonnet 4", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 32000, - "output": 2048 + "context": 200000, + "output": 64000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "open_weights": false, + "knowledge": "2025-03", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 0.01, - "output": 0 - }, - "type": "embedding" + "input": 3.307, + "output": 16.536 + } }, { - "id": "Qwen/Qwen3-Coder-480B-A35B-Instruct", - "name": "Qwen3-Coder-480B-A35B-Instruct", - "display_name": "Qwen3-Coder-480B-A35B-Instruct", + "id": "llama-3.1-405b-instruct", + "name": "Llama 3.1 405B Instruct", + "display_name": "Llama 3.1 405B Instruct", "modalities": { "input": [ "text" @@ -35158,8 +33899,8 @@ ] }, "limit": { - "context": 262144, - "output": 66536 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -35168,19 +33909,18 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-23", - "last_updated": "2025-07-23", + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 2, - "output": 2 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "Qwen/Qwen3-235B-A22B-Thinking-2507", - "name": "Qwen3-235B-A22B-Thinking-2507", - "display_name": "Qwen3-235B-A22B-Thinking-2507", + "id": "qwen3-next-80b-a3b-thinking", + "name": "Qwen3 Next 80B A3B Thinking", + "display_name": "Qwen3 Next 80B A3B Thinking", "modalities": { "input": [ "text" @@ -35190,8 +33930,8 @@ ] }, "limit": { - "context": 262144, - "output": 131072 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -35202,18 +33942,17 @@ "attachment": false, "open_weights": true, "knowledge": "2025-04", - "release_date": "2025-07-25", - "last_updated": "2025-07-25", + "release_date": "2025-09-11", + "last_updated": "2025-09-11", "cost": { - "input": 0.3, - "output": 3 - }, - "type": "chat" + "input": 0.164, + "output": 1.311 + } }, { - "id": "Qwen/Qwen3-Next-80B-A3B-Instruct", - "name": "Qwen3-Next-80B-A3B-Instruct", - "display_name": "Qwen3-Next-80B-A3B-Instruct", + "id": "qwen3-32b", + "name": "Qwen3 32B", + "display_name": "Qwen3 32B", "modalities": { "input": [ "text" @@ -35223,8 +33962,8 @@ ] }, "limit": { - "context": 262144, - "output": 66536 + "context": 16384, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -35233,19 +33972,27 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-09-11", - "last_updated": "2025-09-11", + "knowledge": "2024-12", + "release_date": "2025-04-29", + "last_updated": "2025-04-29", "cost": { - "input": 0.25, - "output": 1 - }, - "type": "chat" - }, + "input": 0.099, + "output": 0.33 + } + } + ] + }, + "github-models": { + "id": "github-models", + "name": "GitHub Models", + "display_name": "GitHub Models", + "api": "https://models.github.ai/inference", + "doc": "https://docs.github.com/en/github-models", + "models": [ { - "id": "Qwen/Qwen3-Next-80B-A3B-Thinking", - "name": "Qwen3-Next-80B-A3B-Thinking", - "display_name": "Qwen3-Next-80B-A3B-Thinking", + "id": "core42/jais-30b-chat", + "name": "JAIS 30b Chat", + "display_name": "JAIS 30b Chat", "modalities": { "input": [ "text" @@ -35255,29 +34002,29 @@ ] }, "limit": { - "context": 262144, - "output": 131072 + "context": 8192, + "output": 2048 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-09-11", - "last_updated": "2025-09-11", + "knowledge": "2023-03", + "release_date": "2023-08-30", + "last_updated": "2023-08-30", "cost": { - "input": 0.3, - "output": 2 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "zai-org/GLM-4.7", - "name": "GLM-4.7", - "display_name": "GLM-4.7", + "id": "xai/grok-3", + "name": "Grok 3", + "display_name": "Grok 3", "modalities": { "input": [ "text" @@ -35287,8 +34034,8 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -35297,21 +34044,19 @@ "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-22", - "last_updated": "2025-12-22", + "open_weights": false, + "knowledge": "2024-10", + "release_date": "2024-12-09", + "last_updated": "2024-12-09", "cost": { - "input": 0.6, - "output": 2.2, - "cache_read": 0.11 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "deepseek-ai/DeepSeek-R1-0528", - "name": "DeepSeek-R1-0528", - "display_name": "DeepSeek-R1-0528", + "id": "xai/grok-3-mini", + "name": "Grok 3 Mini", + "display_name": "Grok 3 Mini", "modalities": { "input": [ "text" @@ -35321,8 +34066,8 @@ ] }, "limit": { - "context": 163840, - "output": 163840 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -35331,20 +34076,19 @@ "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2025-05", - "release_date": "2025-05-28", - "last_updated": "2025-05-28", - "cost": { - "input": 3, - "output": 5 - }, - "type": "chat" + "open_weights": false, + "knowledge": "2024-10", + "release_date": "2024-12-09", + "last_updated": "2024-12-09", + "cost": { + "input": 0, + "output": 0 + } }, { - "id": "deepseek-ai/DeepSeek-V3.2", - "name": "DeepSeek-V3.2", - "display_name": "DeepSeek-V3.2", + "id": "cohere/cohere-command-r-08-2024", + "name": "Cohere Command R 08-2024", + "display_name": "Cohere Command R 08-2024", "modalities": { "input": [ "text" @@ -35354,8 +34098,8 @@ ] }, "limit": { - "context": 163840, - "output": 65536 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -35364,29 +34108,19 @@ "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-12-01", - "last_updated": "2025-12-01", + "open_weights": false, + "knowledge": "2024-03", + "release_date": "2024-08-01", + "last_updated": "2024-08-01", "cost": { - "input": 0.28, - "output": 0.4 - }, - "type": "chat" - } - ] - }, - "opencode": { - "id": "opencode", - "name": "OpenCode Zen", - "display_name": "OpenCode Zen", - "api": "https://opencode.ai/zen/v1", - "doc": "https://opencode.ai/docs/zen", - "models": [ + "input": 0, + "output": 0 + } + }, { - "id": "qwen3-coder", - "name": "Qwen3 Coder", - "display_name": "Qwen3 Coder", + "id": "cohere/cohere-command-a", + "name": "Cohere Command A", + "display_name": "Cohere Command A", "modalities": { "input": [ "text" @@ -35396,42 +34130,40 @@ ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-23", - "last_updated": "2025-07-23", + "open_weights": false, + "knowledge": "2024-03", + "release_date": "2024-11-01", + "last_updated": "2024-11-01", "cost": { - "input": 0.45, - "output": 1.8 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "claude-opus-4-1", - "name": "Claude Opus 4.1", - "display_name": "Claude Opus 4.1", + "id": "cohere/cohere-command-r-plus-08-2024", + "name": "Cohere Command R+ 08-2024", + "display_name": "Cohere Command R+ 08-2024", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -35439,23 +34171,20 @@ "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "knowledge": "2024-03", + "release_date": "2024-08-01", + "last_updated": "2024-08-01", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "kimi-k2", - "name": "Kimi K2", - "display_name": "Kimi K2", + "id": "cohere/cohere-command-r", + "name": "Cohere Command R", + "display_name": "Cohere Command R", "modalities": { "input": [ "text" @@ -35465,78 +34194,40 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-09-05", - "last_updated": "2025-09-05", - "cost": { - "input": 0.4, - "output": 2.5, - "cache_read": 0.4 - }, - "type": "chat" - }, - { - "id": "gpt-5.1-codex", - "name": "GPT-5.1 Codex", - "display_name": "GPT-5.1 Codex", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 400000, - "output": 128000 - }, - "temperature": false, - "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "knowledge": "2024-03", + "release_date": "2024-03-11", + "last_updated": "2024-08-01", "cost": { - "input": 1.07, - "output": 8.5, - "cache_read": 0.107 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "claude-haiku-4-5", - "name": "Claude Haiku 4.5", - "display_name": "Claude Haiku 4.5", + "id": "cohere/cohere-command-r-plus", + "name": "Cohere Command R+", + "display_name": "Cohere Command R+", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -35544,36 +34235,31 @@ "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-02-28", - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "knowledge": "2024-03", + "release_date": "2024-04-04", + "last_updated": "2024-08-01", "cost": { - "input": 1, - "output": 5, - "cache_read": 0.1, - "cache_write": 1.25 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "claude-opus-4-5", - "name": "Claude Opus 4.5", - "display_name": "Claude Opus 4.5", + "id": "deepseek/deepseek-r1-0528", + "name": "DeepSeek-R1-0528", + "display_name": "DeepSeek-R1-0528", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 65536, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -35581,38 +34267,31 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-11-24", - "last_updated": "2025-11-24", + "attachment": false, + "open_weights": true, + "knowledge": "2024-06", + "release_date": "2025-05-28", + "last_updated": "2025-05-28", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "gemini-3-pro", - "name": "Gemini 3 Pro", - "display_name": "Gemini 3 Pro", + "id": "deepseek/deepseek-r1", + "name": "DeepSeek-R1", + "display_name": "DeepSeek-R1", "modalities": { "input": [ - "text", - "image", - "video", - "audio", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 65536, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -35620,27 +34299,20 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-11-18", - "last_updated": "2025-11-18", + "attachment": false, + "open_weights": true, + "knowledge": "2024-06", + "release_date": "2025-01-20", + "last_updated": "2025-01-20", "cost": { - "input": 2, - "output": 12, - "cache_read": 0.2, - "context_over_200k": { - "input": 4, - "output": 18, - "cache_read": 0.4 - } - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "alpha-glm-4.7", - "name": "Alpha GLM-4.7", - "display_name": "Alpha GLM-4.7", + "id": "deepseek/deepseek-v3-0324", + "name": "DeepSeek-V3-0324", + "display_name": "DeepSeek-V3-0324", "modalities": { "input": [ "text" @@ -35650,8 +34322,8 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -35661,33 +34333,30 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-22", - "last_updated": "2025-12-22", + "knowledge": "2024-06", + "release_date": "2025-03-24", + "last_updated": "2025-03-24", "cost": { - "input": 0.6, - "output": 2.2, - "cache_read": 0.6 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "claude-sonnet-4-5", - "name": "Claude Sonnet 4.5", - "display_name": "Claude Sonnet 4.5", + "id": "mistral-ai/mistral-medium-2505", + "name": "Mistral Medium 3 (25.05)", + "display_name": "Mistral Medium 3 (25.05)", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -35695,64 +34364,52 @@ "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "knowledge": "2024-09", + "release_date": "2025-05-01", + "last_updated": "2025-05-01", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75, - "context_over_200k": { - "input": 6, - "output": 22.5, - "cache_read": 0.6, - "cache_write": 7.5 - } - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "gpt-5.1-codex-mini", - "name": "GPT-5.1 Codex Mini", - "display_name": "GPT-5.1 Codex Mini", + "id": "mistral-ai/ministral-3b", + "name": "Ministral 3B", + "display_name": "Ministral 3B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 128000, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "attachment": false, + "open_weights": true, + "knowledge": "2024-03", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.025 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "alpha-gd4", - "name": "Alpha GD4", - "display_name": "Alpha GD4", + "id": "mistral-ai/mistral-nemo", + "name": "Mistral Nemo", + "display_name": "Mistral Nemo", "modalities": { "input": [ "text" @@ -35762,8 +34419,8 @@ ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -35773,20 +34430,18 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "knowledge": "2024-03", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", "cost": { - "input": 0.5, - "output": 2, - "cache_read": 0.15 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "kimi-k2-thinking", - "name": "Kimi K2 Thinking", - "display_name": "Kimi K2 Thinking", + "id": "mistral-ai/mistral-large-2411", + "name": "Mistral Large 24.11", + "display_name": "Mistral Large 24.11", "modalities": { "input": [ "text" @@ -35796,8 +34451,8 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -35806,56 +34461,51 @@ "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-09-05", - "last_updated": "2025-09-05", + "open_weights": false, + "knowledge": "2024-09", + "release_date": "2024-11-01", + "last_updated": "2024-11-01", "cost": { - "input": 0.4, - "output": 2.5, - "cache_read": 0.4 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "gpt-5.1", - "name": "GPT-5.1", - "display_name": "GPT-5.1", + "id": "mistral-ai/codestral-2501", + "name": "Codestral 25.01", + "display_name": "Codestral 25.01", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 32000, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "knowledge": "2024-03", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 1.07, - "output": 8.5, - "cache_read": 0.107 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "gpt-5-nano", - "name": "GPT-5 Nano", - "display_name": "GPT-5 Nano", + "id": "mistral-ai/mistral-small-2503", + "name": "Mistral Small 3.1", + "display_name": "Mistral Small 3.1", "modalities": { "input": [ "text", @@ -35866,66 +34516,61 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 128000, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "knowledge": "2024-09", + "release_date": "2025-03-01", + "last_updated": "2025-03-01", "cost": { "input": 0, - "output": 0, - "cache_read": 0 - }, - "type": "chat" + "output": 0 + } }, { - "id": "gpt-5-codex", - "name": "GPT-5 Codex", - "display_name": "GPT-5 Codex", + "id": "microsoft/phi-3-medium-128k-instruct", + "name": "Phi-3-medium instruct (128k)", + "display_name": "Phi-3-medium instruct (128k)", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 128000, + "output": 4096 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-09-15", - "last_updated": "2025-09-15", + "attachment": false, + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", "cost": { - "input": 1.07, - "output": 8.5, - "cache_read": 0.107 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "big-pickle", - "name": "Big Pickle", - "display_name": "Big Pickle", + "id": "microsoft/phi-3-mini-4k-instruct", + "name": "Phi-3-mini instruct (4k)", + "display_name": "Phi-3-mini instruct (4k)", "modalities": { "input": [ "text" @@ -35935,8 +34580,8 @@ ] }, "limit": { - "context": 200000, - "output": 128000 + "context": 4096, + "output": 1024 }, "temperature": true, "tool_call": true, @@ -35945,58 +34590,19 @@ "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-10-17", - "last_updated": "2025-10-17", - "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 - }, - "type": "chat" - }, - { - "id": "claude-3-5-haiku", - "name": "Claude Haiku 3.5", - "display_name": "Claude Haiku 3.5", - "modalities": { - "input": [ - "text", - "image", - "pdf" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 200000, - "output": 8192 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-07-31", - "release_date": "2024-10-22", - "last_updated": "2024-10-22", + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", "cost": { - "input": 0.8, - "output": 4, - "cache_read": 0.08, - "cache_write": 1 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "glm-4.6", - "name": "GLM-4.6", - "display_name": "GLM-4.6", + "id": "microsoft/phi-3-small-128k-instruct", + "name": "Phi-3-small instruct (128k)", + "display_name": "Phi-3-small instruct (128k)", "modalities": { "input": [ "text" @@ -36006,8 +34612,8 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -36017,31 +34623,30 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-09-30", - "last_updated": "2025-09-30", + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", "cost": { - "input": 0.6, - "output": 2.2, - "cache_read": 0.1 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "glm-4.7-free", - "name": "GLM-4.7", - "display_name": "GLM-4.7", + "id": "microsoft/phi-3.5-vision-instruct", + "name": "Phi-3.5-vision instruct (128k)", + "display_name": "Phi-3.5-vision instruct (128k)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -36051,20 +34656,18 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-22", - "last_updated": "2025-12-22", + "knowledge": "2023-10", + "release_date": "2024-08-20", + "last_updated": "2024-08-20", "cost": { "input": 0, - "output": 0, - "cache_read": 0 - }, - "type": "chat" + "output": 0 + } }, { - "id": "grok-code", - "name": "Grok Code Fast 1", - "display_name": "Grok Code Fast 1", + "id": "microsoft/phi-4", + "name": "Phi-4", + "display_name": "Phi-4", "modalities": { "input": [ "text" @@ -36074,8 +34677,8 @@ ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 16000, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -36083,37 +34686,31 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-08-20", - "last_updated": "2025-08-20", + "attachment": false, + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 - }, - "type": "chat" + "output": 0 + } }, { - "id": "gemini-3-flash", - "name": "Gemini 3 Flash", - "display_name": "Gemini 3 Flash", + "id": "microsoft/phi-4-mini-reasoning", + "name": "Phi-4-mini-reasoning", + "display_name": "Phi-4-mini-reasoning", "modalities": { "input": [ - "text", - "image", - "video", - "audio", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -36121,57 +34718,52 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-12-17", - "last_updated": "2025-12-17", + "attachment": false, + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 0.5, - "output": 3, - "cache_read": 0.05 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "gpt-5.1-codex-max", - "name": "GPT-5.1 Codex Max", - "display_name": "GPT-5.1 Codex Max", + "id": "microsoft/phi-3-small-8k-instruct", + "name": "Phi-3-small instruct (8k)", + "display_name": "Phi-3-small instruct (8k)", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 8192, + "output": 2048 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "attachment": false, + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "minimax-m2.1-free", - "name": "MiniMax M2.1", - "display_name": "MiniMax M2.1", + "id": "microsoft/phi-3.5-mini-instruct", + "name": "Phi-3.5-mini instruct (128k)", + "display_name": "Phi-3.5-mini instruct (128k)", "modalities": { "input": [ "text" @@ -36181,8 +34773,8 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -36192,33 +34784,31 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2025-12-23", - "last_updated": "2025-12-23", + "knowledge": "2023-10", + "release_date": "2024-08-20", + "last_updated": "2024-08-20", "cost": { "input": 0, - "output": 0, - "cache_read": 0 - }, - "type": "chat" + "output": 0 + } }, { - "id": "claude-sonnet-4", - "name": "Claude Sonnet 4", - "display_name": "Claude Sonnet 4", + "id": "microsoft/phi-4-multimodal-instruct", + "name": "Phi-4-multimodal-instruct", + "display_name": "Phi-4-multimodal-instruct", "modalities": { "input": [ "text", "image", - "pdf" + "audio" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -36226,108 +34816,84 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "attachment": false, + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75, - "context_over_200k": { - "input": 6, - "output": 22.5, - "cache_read": 0.6, - "cache_write": 7.5 - } - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "gpt-5", - "name": "GPT-5", - "display_name": "GPT-5", + "id": "microsoft/phi-3-mini-128k-instruct", + "name": "Phi-3-mini instruct (128k)", + "display_name": "Phi-3-mini instruct (128k)", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 128000, + "output": 4096 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "attachment": false, + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", "cost": { - "input": 1.07, - "output": 8.5, - "cache_read": 0.107 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "gpt-5.2", - "name": "GPT-5.2", - "display_name": "GPT-5.2", + "id": "microsoft/phi-3.5-moe-instruct", + "name": "Phi-3.5-MoE instruct (128k)", + "display_name": "Phi-3.5-MoE instruct (128k)", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 128000, + "output": 4096 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "attachment": false, + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-08-20", + "last_updated": "2024-08-20", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 - }, - "type": "chat" - } - ] - }, - "fastrouter": { - "id": "fastrouter", - "name": "FastRouter", - "display_name": "FastRouter", - "api": "https://go.fastrouter.ai/api/v1", - "doc": "https://fastrouter.ai/models", - "models": [ + "input": 0, + "output": 0 + } + }, { - "id": "moonshotai/kimi-k2", - "name": "Kimi K2", - "display_name": "Kimi K2", + "id": "microsoft/phi-4-mini-instruct", + "name": "Phi-4-mini-instruct", + "display_name": "Phi-4-mini-instruct", "modalities": { "input": [ "text" @@ -36337,29 +34903,29 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-07-11", - "last_updated": "2025-07-11", + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 0.55, - "output": 2.2 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "x-ai/grok-4", - "name": "Grok 4", - "display_name": "Grok 4", + "id": "microsoft/phi-3-medium-4k-instruct", + "name": "Phi-3-medium instruct (4k)", + "display_name": "Phi-3-medium instruct (4k)", "modalities": { "input": [ "text" @@ -36369,8 +34935,8 @@ ] }, "limit": { - "context": 256000, - "output": 64000 + "context": 4096, + "output": 1024 }, "temperature": true, "tool_call": true, @@ -36379,35 +34945,30 @@ "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-07-09", - "last_updated": "2025-07-09", + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.75, - "cache_write": 15 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "google/gemini-2.5-flash", - "name": "Gemini 2.5 Flash", - "display_name": "Gemini 2.5 Flash", + "id": "microsoft/phi-4-reasoning", + "name": "Phi-4-Reasoning", + "display_name": "Phi-4-Reasoning", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -36415,35 +34976,31 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-06-17", - "last_updated": "2025-06-17", + "attachment": false, + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 0.3, - "output": 2.5, - "cache_read": 0.0375 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "google/gemini-2.5-pro", - "name": "Gemini 2.5 Pro", - "display_name": "Gemini 2.5 Pro", + "id": "microsoft/mai-ds-r1", + "name": "MAI-DS-R1", + "display_name": "MAI-DS-R1", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 65536, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -36451,22 +35008,20 @@ "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-06-17", - "last_updated": "2025-06-17", + "knowledge": "2024-06", + "release_date": "2025-01-20", + "last_updated": "2025-01-20", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.31 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "openai/gpt-5-nano", - "name": "GPT-5 Nano", - "display_name": "GPT-5 Nano", + "id": "openai/gpt-4.1-nano", + "name": "GPT-4.1-nano", + "display_name": "GPT-4.1-nano", "modalities": { "input": [ "text", @@ -36477,31 +35032,28 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2024-10-01", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.05, - "output": 0.4, - "cache_read": 0.005 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "openai/gpt-4.1", - "name": "GPT-4.1", - "display_name": "GPT-4.1", + "id": "openai/gpt-4.1-mini", + "name": "GPT-4.1-mini", + "display_name": "GPT-4.1-mini", "modalities": { "input": [ "text", @@ -36512,8 +35064,8 @@ ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -36526,51 +35078,46 @@ "release_date": "2025-04-14", "last_updated": "2025-04-14", "cost": { - "input": 2, - "output": 8, - "cache_read": 0.5 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "openai/gpt-5-mini", - "name": "GPT-5 Mini", - "display_name": "GPT-5 Mini", + "id": "openai/o1-preview", + "name": "OpenAI o1-preview", + "display_name": "OpenAI o1-preview", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 128000, + "output": 32768 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-10-01", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "knowledge": "2023-10", + "release_date": "2024-09-12", + "last_updated": "2024-09-12", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.025 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "openai/gpt-oss-20b", - "name": "GPT OSS 20B", - "display_name": "GPT OSS 20B", + "id": "openai/o3-mini", + "name": "OpenAI o3-mini", + "display_name": "OpenAI o3-mini", "modalities": { "input": [ "text" @@ -36580,61 +35127,62 @@ ] }, "limit": { - "context": 131072, - "output": 65536 + "context": 200000, + "output": 100000 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": true, "default": true }, "attachment": false, - "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-01-31", + "last_updated": "2025-01-31", "cost": { - "input": 0.05, - "output": 0.2 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "openai/gpt-oss-120b", - "name": "GPT OSS 120B", - "display_name": "GPT OSS 120B", + "id": "openai/gpt-4o", + "name": "GPT-4o", + "display_name": "GPT-4o", "modalities": { "input": [ - "text" + "text", + "image", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "attachment": true, + "open_weights": false, + "knowledge": "2023-10", + "release_date": "2024-05-13", + "last_updated": "2024-05-13", "cost": { - "input": 0.15, - "output": 0.6 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "openai/gpt-5", - "name": "GPT-5", - "display_name": "GPT-5", + "id": "openai/gpt-4.1", + "name": "GPT-4.1", + "display_name": "GPT-4.1", "modalities": { "input": [ "text", @@ -36645,68 +35193,65 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2024-10-01", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "qwen/qwen3-coder", - "name": "Qwen3 Coder", - "display_name": "Qwen3 Coder", + "id": "openai/o4-mini", + "name": "OpenAI o4-mini", + "display_name": "OpenAI o4-mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 66536 + "context": 200000, + "output": 100000 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-23", - "last_updated": "2025-07-23", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-01-31", + "last_updated": "2025-01-31", "cost": { - "input": 0.3, - "output": 1.2 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "anthropic/claude-opus-4.1", - "name": "Claude Opus 4.1", - "display_name": "Claude Opus 4.1", + "id": "openai/o1", + "name": "OpenAI o1", + "display_name": "OpenAI o1", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" @@ -36714,153 +35259,139 @@ }, "limit": { "context": 200000, - "output": 32000 + "output": 100000 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "knowledge": "2023-10", + "release_date": "2024-09-12", + "last_updated": "2024-12-17", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "anthropic/claude-sonnet-4", - "name": "Claude Sonnet 4", - "display_name": "Claude Sonnet 4", + "id": "openai/o1-mini", + "name": "OpenAI o1-mini", + "display_name": "OpenAI o1-mini", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 128000, + "output": 65536 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "knowledge": "2023-10", + "release_date": "2024-09-12", + "last_updated": "2024-12-17", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "deepseek-ai/deepseek-r1-distill-llama-70b", - "name": "DeepSeek R1 Distill Llama 70B", - "display_name": "DeepSeek R1 Distill Llama 70B", + "id": "openai/o3", + "name": "OpenAI o3", + "display_name": "OpenAI o3", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": false, "reasoning": { "supported": true, "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-01-23", - "last_updated": "2025-01-23", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-01-31", + "last_updated": "2025-01-31", "cost": { - "input": 0.03, - "output": 0.14 - }, - "type": "chat" - } - ] - }, - "minimax": { - "id": "minimax", - "name": "MiniMax", - "display_name": "MiniMax", - "api": "https://api.minimax.io/anthropic/v1", - "doc": "https://platform.minimax.io/docs/guides/quickstart", - "models": [ + "input": 0, + "output": 0 + } + }, { - "id": "MiniMax-M2", - "name": "MiniMax-M2", - "display_name": "MiniMax-M2", + "id": "openai/gpt-4o-mini", + "name": "GPT-4o mini", + "display_name": "GPT-4o mini", "modalities": { "input": [ - "text" + "text", + "image", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 196608, - "output": 128000 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2025-10-27", - "last_updated": "2025-10-27", + "attachment": true, + "open_weights": false, + "knowledge": "2023-10", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", "cost": { - "input": 0.3, - "output": 1.2 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "MiniMax-M2.1", - "name": "MiniMax-M2.1", - "display_name": "MiniMax-M2.1", + "id": "meta/llama-3.2-11b-vision-instruct", + "name": "Llama-3.2-11B-Vision-Instruct", + "display_name": "Llama-3.2-11B-Vision-Instruct", "modalities": { "input": [ - "text" + "text", + "image", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -36870,26 +35401,18 @@ }, "attachment": false, "open_weights": true, - "release_date": "2025-12-23", - "last_updated": "2025-12-23", + "knowledge": "2023-12", + "release_date": "2024-09-25", + "last_updated": "2024-09-25", "cost": { - "input": 0.3, - "output": 1.2 - }, - "type": "chat" - } - ] - }, - "google": { - "id": "google", - "name": "google", - "display_name": "google", - "doc": "https://ai.google.dev/gemini-api/docs/pricing", - "models": [ + "input": 0, + "output": 0 + } + }, { - "id": "gemini-embedding-001", - "name": "Gemini Embedding 001", - "display_name": "Gemini Embedding 001", + "id": "meta/meta-llama-3.1-405b-instruct", + "name": "Meta-Llama-3.1-405B-Instruct", + "display_name": "Meta-Llama-3.1-405B-Instruct", "modalities": { "input": [ "text" @@ -36899,44 +35422,41 @@ ] }, "limit": { - "context": 2048, - "output": 3072 + "context": 128000, + "output": 32768 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2025-05", - "release_date": "2025-05-20", - "last_updated": "2025-05-20", + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 0.15, + "input": 0, "output": 0 - }, - "type": "embedding" + } }, { - "id": "gemini-3-flash-preview", - "name": "Gemini 3 Flash Preview", - "display_name": "Gemini 3 Flash Preview", + "id": "meta/llama-4-maverick-17b-128e-instruct-fp8", + "name": "Llama 4 Maverick 17B 128E Instruct FP8", + "display_name": "Llama 4 Maverick 17B 128E Instruct FP8", "modalities": { "input": [ "text", - "image", - "video", - "audio", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -36944,77 +35464,63 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-12-17", - "last_updated": "2025-12-17", + "attachment": false, + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2025-01-31", + "last_updated": "2025-01-31", "cost": { - "input": 0.5, - "output": 3, - "cache_read": 0.05, - "context_over_200k": { - "input": 0.5, - "output": 3, - "cache_read": 0.05 - } - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "gemini-2.5-flash-image", - "name": "Gemini 2.5 Flash Image", - "display_name": "Gemini 2.5 Flash Image", + "id": "meta/meta-llama-3-70b-instruct", + "name": "Meta-Llama-3-70B-Instruct", + "display_name": "Meta-Llama-3-70B-Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "text", - "image" + "text" ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 8192, + "output": 2048 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2025-06", - "release_date": "2025-08-26", - "last_updated": "2025-08-26", + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-04-18", + "last_updated": "2024-04-18", "cost": { - "input": 0.3, - "output": 30, - "cache_read": 0.075 - }, - "type": "imageGeneration" + "input": 0, + "output": 0 + } }, { - "id": "gemini-2.5-flash-preview-05-20", - "name": "Gemini 2.5 Flash Preview 05-20", - "display_name": "Gemini 2.5 Flash Preview 05-20", + "id": "meta/meta-llama-3.1-70b-instruct", + "name": "Meta-Llama-3.1-70B-Instruct", + "display_name": "Meta-Llama-3.1-70B-Instruct", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -37022,37 +35528,31 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-05-20", - "last_updated": "2025-05-20", + "attachment": false, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 0.15, - "output": 0.6, - "cache_read": 0.0375 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "gemini-flash-lite-latest", - "name": "Gemini Flash-Lite Latest", - "display_name": "Gemini Flash-Lite Latest", + "id": "meta/llama-3.3-70b-instruct", + "name": "Llama-3.3-70B-Instruct", + "display_name": "Llama-3.3-70B-Instruct", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -37060,37 +35560,33 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-09-25", - "last_updated": "2025-09-25", + "attachment": false, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.025 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "gemini-3-pro-preview", - "name": "Gemini 3 Pro Preview", - "display_name": "Gemini 3 Pro Preview", + "id": "meta/llama-3.2-90b-vision-instruct", + "name": "Llama-3.2-90B-Vision-Instruct", + "display_name": "Llama-3.2-90B-Vision-Instruct", "modalities": { "input": [ "text", "image", - "video", - "audio", - "pdf" + "audio" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -37098,87 +35594,64 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-11-18", - "last_updated": "2025-11-18", + "attachment": false, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-09-25", + "last_updated": "2024-09-25", "cost": { - "input": 2, - "output": 12, - "cache_read": 0.2, - "context_over_200k": { - "input": 4, - "output": 18, - "cache_read": 0.4 - } - }, - "type": "chat" - }, + "input": 0, + "output": 0 + } + }, { - "id": "gemini-2.5-flash", - "name": "Gemini 2.5 Flash", - "display_name": "Gemini 2.5 Flash", + "id": "meta/meta-llama-3-8b-instruct", + "name": "Meta-Llama-3-8B-Instruct", + "display_name": "Meta-Llama-3-8B-Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 8192, + "output": 2048 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true, - "budget": { - "default": -1, - "min": 0, - "max": 24576 - } - }, - "search": { - "supported": true, - "default": false + "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-03-20", - "last_updated": "2025-06-05", + "attachment": false, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-04-18", + "last_updated": "2024-04-18", "cost": { - "input": 0.3, - "output": 2.5, - "cache_read": 0.075, - "input_audio": 1 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "gemini-flash-latest", - "name": "Gemini Flash Latest", - "display_name": "Gemini Flash Latest", + "id": "meta/llama-4-scout-17b-16e-instruct", + "name": "Llama 4 Scout 17B 16E Instruct", + "display_name": "Llama 4 Scout 17B 16E Instruct", "modalities": { "input": [ "text", - "image", - "audio", - "video", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -37186,38 +35659,31 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-09-25", - "last_updated": "2025-09-25", + "attachment": false, + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2025-01-31", + "last_updated": "2025-01-31", "cost": { - "input": 0.3, - "output": 2.5, - "cache_read": 0.075, - "input_audio": 1 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "gemini-2.5-pro-preview-05-06", - "name": "Gemini 2.5 Pro Preview 05-06", - "display_name": "Gemini 2.5 Pro Preview 05-06", + "id": "meta/meta-llama-3.1-8b-instruct", + "name": "Meta-Llama-3.1-8B-Instruct", + "display_name": "Meta-Llama-3.1-8B-Instruct", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -37225,128 +35691,123 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-05-06", - "last_updated": "2025-05-06", + "attachment": false, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.31 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "gemini-2.5-flash-preview-tts", - "name": "Gemini 2.5 Flash Preview TTS", - "display_name": "Gemini 2.5 Flash Preview TTS", + "id": "ai21-labs/ai21-jamba-1.5-large", + "name": "AI21 Jamba 1.5 Large", + "display_name": "AI21 Jamba 1.5 Large", "modalities": { "input": [ "text" ], "output": [ - "audio" + "text" ] }, "limit": { - "context": 8000, - "output": 16000 + "context": 256000, + "output": 4096 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-05-01", - "last_updated": "2025-05-01", + "knowledge": "2024-03", + "release_date": "2024-08-29", + "last_updated": "2024-08-29", "cost": { - "input": 0.5, - "output": 10 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "gemini-2.0-flash-lite", - "name": "Gemini 2.0 Flash Lite", - "display_name": "Gemini 2.0 Flash Lite", + "id": "ai21-labs/ai21-jamba-1.5-mini", + "name": "AI21 Jamba 1.5 Mini", + "display_name": "AI21 Jamba 1.5 Mini", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 8192 + "context": 256000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false - }, - "search": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-06", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "knowledge": "2024-03", + "release_date": "2024-08-29", + "last_updated": "2024-08-29", "cost": { - "input": 0.075, - "output": 0.3 - }, - "type": "chat" - }, + "input": 0, + "output": 0 + } + } + ] + }, + "togetherai": { + "id": "togetherai", + "name": "Together AI", + "display_name": "Together AI", + "doc": "https://docs.together.ai/docs/serverless-models", + "models": [ { - "id": "gemini-live-2.5-flash-preview-native-audio", - "name": "Gemini Live 2.5 Flash Preview Native Audio", - "display_name": "Gemini Live 2.5 Flash Preview Native Audio", + "id": "moonshotai/Kimi-K2-Instruct", + "name": "Kimi K2 Instruct", + "display_name": "Kimi K2 Instruct", "modalities": { "input": [ - "text", - "audio", - "video" + "text" ], "output": [ - "text", - "audio" + "text" ] }, "limit": { "context": 131072, - "output": 65536 + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-06-17", - "last_updated": "2025-09-18", + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2025-07-14", + "last_updated": "2025-07-14", "cost": { - "input": 0.5, - "output": 2, - "input_audio": 3, - "output_audio": 12 - }, - "type": "chat" + "input": 1, + "output": 3 + } }, { - "id": "gemini-2.0-flash", - "name": "Gemini 2.0 Flash", - "display_name": "Gemini 2.0 Flash", + "id": "moonshotai/Kimi-K2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ "text", @@ -37357,94 +35818,71 @@ ] }, "limit": { - "context": 1048576, - "output": 8192 + "context": 262144, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false - }, - "search": { - "supported": true, - "default": false + "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-06", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "attachment": false, + "open_weights": true, + "knowledge": "2026-01", + "release_date": "2026-01-27", + "last_updated": "2026-01-27", "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.025 - }, - "type": "chat" + "input": 0.5, + "output": 2.8 + } }, { - "id": "gemini-2.5-flash-lite", - "name": "Gemini 2.5 Flash Lite", - "display_name": "Gemini 2.5 Flash Lite", + "id": "moonshotai/Kimi-K2-Instruct-0905", + "name": "Kimi K2 Instruct-0905", + "display_name": "Kimi K2 Instruct-0905", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 262144, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false, - "budget": { - "default": -1, - "min": 512, - "max": 24576 - } - }, - "search": { - "supported": true, - "default": false + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-06-17", - "last_updated": "2025-06-17", + "attachment": false, + "open_weights": true, + "knowledge": "2025-09", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.025 - }, - "type": "chat" + "input": 1, + "output": 3 + } }, { - "id": "gemini-2.5-pro-preview-06-05", - "name": "Gemini 2.5 Pro Preview 06-05", - "display_name": "Gemini 2.5 Pro Preview 06-05", + "id": "moonshotai/Kimi-K2-Thinking", + "name": "Kimi K2 Thinking", + "display_name": "Kimi K2 Thinking", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 262144, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -37452,76 +35890,62 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-06-05", - "last_updated": "2025-06-05", + "attachment": false, + "open_weights": true, + "knowledge": "2025-07", + "release_date": "2025-11-06", + "last_updated": "2025-11-06", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.31 - }, - "type": "chat" + "input": 1.2, + "output": 4 + } }, { - "id": "gemini-live-2.5-flash", - "name": "Gemini Live 2.5 Flash", - "display_name": "Gemini Live 2.5 Flash", + "id": "essentialai/Rnj-1-Instruct", + "name": "Rnj-1 Instruct", + "display_name": "Rnj-1 Instruct", "modalities": { "input": [ - "text", - "image", - "audio", - "video" + "text" ], "output": [ - "text", - "audio" + "text" ] }, "limit": { - "context": 128000, - "output": 8000 + "context": 32768, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-09-01", - "last_updated": "2025-09-01", + "attachment": false, + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2025-12-05", + "last_updated": "2025-12-05", "cost": { - "input": 0.5, - "output": 2, - "input_audio": 3, - "output_audio": 12 - }, - "type": "chat" + "input": 0.15, + "output": 0.15 + } }, { - "id": "gemini-2.5-flash-lite-preview-06-17", - "name": "Gemini 2.5 Flash Lite Preview 06-17", - "display_name": "Gemini 2.5 Flash Lite Preview 06-17", + "id": "openai/gpt-oss-120b", + "name": "GPT OSS 120B", + "display_name": "GPT OSS 120B", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -37529,534 +35953,450 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-06-17", - "last_updated": "2025-06-17", + "attachment": false, + "open_weights": true, + "knowledge": "2025-08", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.025, - "input_audio": 0.3 - }, - "type": "chat" + "input": 0.15, + "output": 0.6 + } }, { - "id": "gemini-2.5-flash-image-preview", - "name": "Gemini 2.5 Flash Image Preview", - "display_name": "Gemini 2.5 Flash Image Preview", + "id": "meta-llama/Llama-3.3-70B-Instruct-Turbo", + "name": "Llama 3.3 70B", + "display_name": "Llama 3.3 70B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "text", - "image" + "text" ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 131072, + "output": 66536 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2025-06", - "release_date": "2025-08-26", - "last_updated": "2025-08-26", + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 0.3, - "output": 30, - "cache_read": 0.075 - }, - "type": "imageGeneration" + "input": 0.88, + "output": 0.88 + } }, { - "id": "gemini-2.5-flash-preview-09-2025", - "name": "Gemini 2.5 Flash Preview 09 2025", - "display_name": "Gemini 2.5 Flash Preview 09 2025", + "id": "Qwen/Qwen3-Coder-Next-FP8", + "name": "Qwen3 Coder Next FP8", + "display_name": "Qwen3 Coder Next FP8", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 262144, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true, - "budget": { - "default": -1, - "min": 0, - "max": 24576 - } - }, - "search": { - "supported": true, - "default": false + "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-09-25", - "last_updated": "2025-09-25", + "attachment": false, + "open_weights": true, + "knowledge": "2026-02-03", + "release_date": "2026-02-03", + "last_updated": "2026-02-03", "cost": { - "input": 0.3, - "output": 2.5, - "cache_read": 0.075, - "input_audio": 1 - }, - "type": "chat" + "input": 0.5, + "output": 1.2 + } }, { - "id": "gemini-2.5-flash-preview-04-17", - "name": "Gemini 2.5 Flash Preview 04-17", - "display_name": "Gemini 2.5 Flash Preview 04-17", + "id": "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8", + "name": "Qwen3 Coder 480B A35B Instruct", + "display_name": "Qwen3 Coder 480B A35B Instruct", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 262144, + "output": 66536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-04-17", - "last_updated": "2025-04-17", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", "cost": { - "input": 0.15, - "output": 0.6, - "cache_read": 0.0375 - }, - "type": "chat" - }, + "input": 2, + "output": 2 + } + }, { - "id": "gemini-2.5-pro-preview-tts", - "name": "Gemini 2.5 Pro Preview TTS", - "display_name": "Gemini 2.5 Pro Preview TTS", + "id": "Qwen/Qwen3-235B-A22B-Instruct-2507-tput", + "name": "Qwen3 235B A22B Instruct 2507 FP8", + "display_name": "Qwen3 235B A22B Instruct 2507 FP8", "modalities": { "input": [ "text" ], "output": [ - "audio" + "text" ] }, "limit": { - "context": 8000, - "output": 16000 + "context": 262144, + "output": 131072 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-05-01", - "last_updated": "2025-05-01", + "open_weights": true, + "knowledge": "2025-07", + "release_date": "2025-07-25", + "last_updated": "2025-07-25", "cost": { - "input": 1, - "output": 20 - }, - "type": "chat" + "input": 0.2, + "output": 0.6 + } }, { - "id": "gemini-2.5-pro", - "name": "Gemini 2.5 Pro", - "display_name": "Gemini 2.5 Pro", + "id": "Qwen/Qwen3-Next-80B-A3B-Instruct", + "name": "Qwen3-Next-80B-A3B-Instruct", + "display_name": "Qwen3-Next-80B-A3B-Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 262144, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true, - "budget": { - "default": -1, - "min": 128, - "max": 32768 - } - }, - "search": { - "supported": true, - "default": false + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-03-20", - "last_updated": "2025-06-05", + "attachment": false, + "open_weights": true, + "knowledge": "2025-07", + "release_date": "2025-07-25", + "last_updated": "2025-07-25", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.31 - }, - "type": "chat" + "input": 0.15, + "output": 1.5 + } }, { - "id": "gemini-1.5-flash", - "name": "Gemini 1.5 Flash", - "display_name": "Gemini 1.5 Flash", + "id": "zai-org/GLM-4.7", + "name": "GLM-4.7", + "display_name": "GLM-4.7", "modalities": { "input": [ - "text", - "image", - "audio", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 8192 + "context": 200000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-05-14", - "last_updated": "2024-05-14", + "attachment": false, + "open_weights": true, + "knowledge": "2025-07", + "release_date": "2025-07-25", + "last_updated": "2025-07-25", "cost": { - "input": 0.075, - "output": 0.3, - "cache_read": 0.01875 - }, - "type": "chat" + "input": 0.45, + "output": 2 + } }, { - "id": "gemini-1.5-flash-8b", - "name": "Gemini 1.5 Flash-8B", - "display_name": "Gemini 1.5 Flash-8B", + "id": "zai-org/GLM-4.6", + "name": "GLM 4.6", + "display_name": "GLM 4.6", "modalities": { "input": [ - "text", - "image", - "audio", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 8192 + "context": 200000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-10-03", - "last_updated": "2024-10-03", + "attachment": false, + "open_weights": true, + "knowledge": "2025-09", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", "cost": { - "input": 0.0375, - "output": 0.15, - "cache_read": 0.01 - }, - "type": "chat" + "input": 0.6, + "output": 2.2 + } }, { - "id": "gemini-2.5-flash-lite-preview-09-2025", - "name": "Gemini 2.5 Flash Lite Preview 09 2025", - "display_name": "Gemini 2.5 Flash Lite Preview 09 2025", + "id": "deepseek-ai/DeepSeek-R1", + "name": "DeepSeek R1", + "display_name": "DeepSeek R1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 163839, + "output": 12288 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, - "default": false, - "budget": { - "default": -1, - "min": 512, - "max": 24576 - } - }, - "search": { - "supported": true, - "default": false + "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-09-25", - "last_updated": "2025-09-25", + "attachment": false, + "open_weights": true, + "knowledge": "2024-07", + "release_date": "2024-12-26", + "last_updated": "2025-03-24", "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.025 - }, - "type": "chat" + "input": 3, + "output": 7 + } }, { - "id": "gemini-1.5-pro", - "name": "Gemini 1.5 Pro", - "display_name": "Gemini 1.5 Pro", + "id": "deepseek-ai/DeepSeek-V3", + "name": "DeepSeek V3", + "display_name": "DeepSeek V3", "modalities": { "input": [ - "text", - "image", - "audio", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 8192 + "context": 131072, + "output": 12288 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-02-15", - "last_updated": "2024-02-15", + "attachment": false, + "open_weights": true, + "knowledge": "2024-07", + "release_date": "2025-01-20", + "last_updated": "2025-05-29", "cost": { "input": 1.25, - "output": 5, - "cache_read": 0.3125 - }, - "type": "chat" + "output": 1.25 + } }, { - "id": "gemini-2.0-flash-preview-image-generation", - "name": "Gemini 2.0 Flash Preview Image Generation", - "display_name": "Gemini 2.0 Flash Preview Image Generation", + "id": "deepseek-ai/DeepSeek-V3-1", + "name": "DeepSeek V3.1", + "display_name": "DeepSeek V3.1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "text", - "image" + "text" ] }, "limit": { - "context": 32000, - "output": 8192 + "context": 131072, + "output": 12288 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false - }, - "search": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "type": "chat" + "attachment": false, + "open_weights": true, + "knowledge": "2025-08", + "release_date": "2025-08-21", + "last_updated": "2025-08-21", + "cost": { + "input": 0.6, + "output": 1.7 + } } ] }, - "google-vertex": { - "id": "google-vertex", - "name": "Vertex", - "display_name": "Vertex", - "doc": "https://cloud.google.com/vertex-ai/generative-ai/docs/models", + "azure": { + "id": "azure", + "name": "Azure", + "display_name": "Azure", + "doc": "https://learn.microsoft.com/en-us/azure/ai-services/openai/concepts/models", "models": [ { - "id": "gemini-embedding-001", - "name": "Gemini Embedding 001", - "display_name": "Gemini Embedding 001", + "id": "gpt-4.1-nano", + "name": "GPT-4.1 nano", + "display_name": "GPT-4.1 nano", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 2048, - "output": 3072 + "context": 1047576, + "output": 32768 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-05", - "release_date": "2025-05-20", - "last_updated": "2025-05-20", + "knowledge": "2024-05", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.15, - "output": 0 - }, - "type": "embedding" + "input": 0.1, + "output": 0.4, + "cache_read": 0.03 + } }, { - "id": "gemini-3-flash-preview", - "name": "Gemini 3 Flash Preview", - "display_name": "Gemini 3 Flash Preview", + "id": "text-embedding-3-small", + "name": "text-embedding-3-small", + "display_name": "text-embedding-3-small", "modalities": { "input": [ - "text", - "image", - "video", - "audio", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 8191, + "output": 1536 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-12-17", - "last_updated": "2025-12-17", + "release_date": "2024-01-25", + "last_updated": "2024-01-25", "cost": { - "input": 0.5, - "output": 3, - "cache_read": 0.05, - "context_over_200k": { - "input": 0.5, - "output": 3, - "cache_read": 0.05 - } - }, - "type": "chat" + "input": 0.02, + "output": 0 + } }, { - "id": "gemini-2.5-flash-preview-05-20", - "name": "Gemini 2.5 Flash Preview 05-20", - "display_name": "Gemini 2.5 Flash Preview 05-20", + "id": "grok-4-fast-non-reasoning", + "name": "Grok 4 Fast (Non-Reasoning)", + "display_name": "Grok 4 Fast (Non-Reasoning)", "modalities": { "input": [ "text", - "image", - "audio", - "video", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 2000000, + "output": 30000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-05-20", - "last_updated": "2025-05-20", + "knowledge": "2025-07", + "release_date": "2025-09-19", + "last_updated": "2025-09-19", "cost": { - "input": 0.15, - "output": 0.6, - "cache_read": 0.0375 - }, - "type": "chat" + "input": 0.2, + "output": 0.5, + "cache_read": 0.05 + } }, { - "id": "gemini-flash-lite-latest", - "name": "Gemini Flash-Lite Latest", - "display_name": "Gemini Flash-Lite Latest", + "id": "deepseek-r1-0528", + "name": "DeepSeek-R1-0528", + "display_name": "DeepSeek-R1-0528", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 163840, + "output": 163840 }, "temperature": true, "tool_call": true, @@ -38064,37 +36404,32 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-09-25", - "last_updated": "2025-09-25", + "attachment": false, + "open_weights": true, + "knowledge": "2024-07", + "release_date": "2025-05-28", + "last_updated": "2025-05-28", "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.025 - }, - "type": "chat" + "input": 1.35, + "output": 5.4 + } }, { - "id": "gemini-3-pro-preview", - "name": "Gemini 3 Pro Preview", - "display_name": "Gemini 3 Pro Preview", + "id": "grok-4-fast-reasoning", + "name": "Grok 4 Fast (Reasoning)", + "display_name": "Grok 4 Fast (Reasoning)", "modalities": { "input": [ "text", - "image", - "video", - "audio", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 2000000, + "output": 30000 }, "temperature": true, "tool_call": true, @@ -38104,109 +36439,85 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-11-18", - "last_updated": "2025-11-18", + "knowledge": "2025-07", + "release_date": "2025-09-19", + "last_updated": "2025-09-19", "cost": { - "input": 2, - "output": 12, - "cache_read": 0.2, - "context_over_200k": { - "input": 4, - "output": 18, - "cache_read": 0.4 - } - }, - "type": "chat" + "input": 0.2, + "output": 0.5, + "cache_read": 0.05 + } }, { - "id": "gemini-2.5-flash", - "name": "Gemini 2.5 Flash", - "display_name": "Gemini 2.5 Flash", + "id": "phi-3-medium-128k-instruct", + "name": "Phi-3-medium-instruct (128k)", + "display_name": "Phi-3-medium-instruct (128k)", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 128000, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-06-17", - "last_updated": "2025-06-17", + "attachment": false, + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", "cost": { - "input": 0.3, - "output": 2.5, - "cache_read": 0.075, - "cache_write": 0.383 - }, - "type": "chat" + "input": 0.17, + "output": 0.68 + } }, { - "id": "gemini-flash-latest", - "name": "Gemini Flash Latest", - "display_name": "Gemini Flash Latest", + "id": "gpt-4", + "name": "GPT-4", + "display_name": "GPT-4", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 8192, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-09-25", - "last_updated": "2025-09-25", - "cost": { - "input": 0.3, - "output": 2.5, - "cache_read": 0.075, - "cache_write": 0.383 - }, - "type": "chat" + "knowledge": "2023-11", + "release_date": "2023-03-14", + "last_updated": "2023-03-14", + "cost": { + "input": 60, + "output": 120 + } }, { - "id": "gemini-2.5-pro-preview-05-06", - "name": "Gemini 2.5 Pro Preview 05-06", - "display_name": "Gemini 2.5 Pro Preview 05-06", + "id": "claude-opus-4-1", + "name": "Claude Opus 4.1", + "display_name": "Claude Opus 4.1", "modalities": { "input": [ "text", "image", - "audio", - "video", "pdf" ], "output": [ @@ -38214,8 +36525,8 @@ ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 200000, + "output": 32000 }, "temperature": true, "tool_call": true, @@ -38225,70 +36536,65 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-05-06", - "last_updated": "2025-05-06", + "knowledge": "2025-03-31", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.31 - }, - "type": "chat" + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 + } }, { - "id": "gemini-2.0-flash-lite", - "name": "Gemini 2.0 Flash Lite", - "display_name": "Gemini 2.0 Flash Lite", + "id": "gpt-5.2-chat", + "name": "GPT-5.2 Chat", + "display_name": "GPT-5.2 Chat", "modalities": { "input": [ "text", - "image", - "audio", - "video", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 8192 + "context": 128000, + "output": 16384 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2024-06", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 0.075, - "output": 0.3 - }, - "type": "chat" + "input": 1.75, + "output": 14, + "cache_read": 0.175 + } }, { - "id": "gemini-2.0-flash", - "name": "Gemini 2.0 Flash", - "display_name": "Gemini 2.0 Flash", + "id": "llama-3.2-11b-vision-instruct", + "name": "Llama-3.2-11B-Vision-Instruct", + "display_name": "Llama-3.2-11B-Vision-Instruct", "modalities": { "input": [ "text", - "image", - "audio", - "video", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, + "context": 128000, "output": 8192 }, "temperature": true, @@ -38297,74 +36603,61 @@ "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2024-06", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-09-25", + "last_updated": "2024-09-25", "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.025 - }, - "type": "chat" + "input": 0.37, + "output": 0.37 + } }, { - "id": "gemini-2.5-flash-lite", - "name": "Gemini 2.5 Flash Lite", - "display_name": "Gemini 2.5 Flash Lite", + "id": "cohere-embed-v-4-0", + "name": "Embed v4", + "display_name": "Embed v4", "modalities": { "input": [ "text", - "image", - "audio", - "video", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 128000, + "output": 1536 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-06-17", - "last_updated": "2025-06-17", + "open_weights": true, + "release_date": "2025-04-15", + "last_updated": "2025-04-15", "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.025 - }, - "type": "chat" + "input": 0.12, + "output": 0 + } }, { - "id": "gemini-2.5-pro-preview-06-05", - "name": "Gemini 2.5 Pro Preview 06-05", - "display_name": "Gemini 2.5 Pro Preview 06-05", + "id": "cohere-command-r-08-2024", + "name": "Command R", + "display_name": "Command R", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 128000, + "output": 4000 }, "temperature": true, "tool_call": true, @@ -38372,37 +36665,31 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-06-05", - "last_updated": "2025-06-05", + "attachment": false, + "open_weights": true, + "knowledge": "2024-06-01", + "release_date": "2024-08-30", + "last_updated": "2024-08-30", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.31 - }, - "type": "chat" + "input": 0.15, + "output": 0.6 + } }, { - "id": "gemini-2.5-flash-lite-preview-06-17", - "name": "Gemini 2.5 Flash Lite Preview 06-17", - "display_name": "Gemini 2.5 Flash Lite Preview 06-17", + "id": "grok-4", + "name": "Grok 4", + "display_name": "Grok 4", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 65536, - "output": 65536 + "context": 256000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -38410,175 +36697,148 @@ "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-06-17", - "last_updated": "2025-06-17", + "knowledge": "2025-07", + "release_date": "2025-07-09", + "last_updated": "2025-07-09", "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.025 - }, - "type": "chat" + "input": 3, + "output": 15, + "reasoning": 15, + "cache_read": 0.75 + } }, { - "id": "gemini-2.5-flash-preview-09-2025", - "name": "Gemini 2.5 Flash Preview 09-25", - "display_name": "Gemini 2.5 Flash Preview 09-25", + "id": "cohere-embed-v3-multilingual", + "name": "Embed v3 Multilingual", + "display_name": "Embed v3 Multilingual", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 512, + "output": 1024 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-09-25", - "last_updated": "2025-09-25", + "attachment": false, + "open_weights": true, + "release_date": "2023-11-07", + "last_updated": "2023-11-07", "cost": { - "input": 0.3, - "output": 2.5, - "cache_read": 0.075, - "cache_write": 0.383 - }, - "type": "chat" + "input": 0.1, + "output": 0 + } }, { - "id": "gemini-2.5-flash-preview-04-17", - "name": "Gemini 2.5 Flash Preview 04-17", - "display_name": "Gemini 2.5 Flash Preview 04-17", + "id": "phi-4-mini", + "name": "Phi-4-mini", + "display_name": "Phi-4-mini", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-04-17", - "last_updated": "2025-04-17", + "attachment": false, + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 0.15, - "output": 0.6, - "cache_read": 0.0375 - }, - "type": "chat" + "input": 0.075, + "output": 0.3 + } }, { - "id": "gemini-2.5-pro", - "name": "Gemini 2.5 Pro", - "display_name": "Gemini 2.5 Pro", + "id": "gpt-4-32k", + "name": "GPT-4 32K", + "display_name": "GPT-4 32K", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 32768, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-03-20", - "last_updated": "2025-06-05", + "knowledge": "2023-11", + "release_date": "2023-03-14", + "last_updated": "2023-03-14", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.31 - }, - "type": "chat" + "input": 60, + "output": 120 + } }, { - "id": "gemini-2.5-flash-lite-preview-09-2025", - "name": "Gemini 2.5 Flash Lite Preview 09-25", - "display_name": "Gemini 2.5 Flash Lite Preview 09-25", + "id": "gpt-5.2-codex", + "name": "GPT-5.2 Codex", + "display_name": "GPT-5.2 Codex", "modalities": { "input": [ "text", - "image", - "audio", - "video", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-09-25", - "last_updated": "2025-09-25", + "knowledge": "2025-08-31", + "release_date": "2026-01-14", + "last_updated": "2026-01-14", "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.025 - }, - "type": "chat" + "input": 1.75, + "output": 14, + "cache_read": 0.175 + } }, { - "id": "openai/gpt-oss-120b-maas", - "name": "GPT OSS 120B", - "display_name": "GPT OSS 120B", + "id": "meta-llama-3.1-405b-instruct", + "name": "Meta-Llama-3.1-405B-Instruct", + "display_name": "Meta-Llama-3.1-405B-Instruct", "modalities": { "input": [ "text" @@ -38588,29 +36848,28 @@ ] }, "limit": { - "context": 131072, + "context": 128000, "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 0.09, - "output": 0.36 - }, - "type": "chat" + "input": 5.33, + "output": 16 + } }, { - "id": "openai/gpt-oss-20b-maas", - "name": "GPT OSS 20B", - "display_name": "GPT OSS 20B", + "id": "deepseek-r1", + "name": "DeepSeek-R1", + "display_name": "DeepSeek-R1", "modalities": { "input": [ "text" @@ -38620,37 +36879,29 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 163840, + "output": 163840 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, "attachment": false, "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "knowledge": "2024-07", + "release_date": "2025-01-20", + "last_updated": "2025-01-20", "cost": { - "input": 0.07, - "output": 0.25 - }, - "type": "chat" - } - ] - }, - "cloudflare-workers-ai": { - "id": "cloudflare-workers-ai", - "name": "Cloudflare Workers AI", - "display_name": "Cloudflare Workers AI", - "doc": "https://developers.cloudflare.com/workers-ai/models/", - "models": [ + "input": 1.35, + "output": 5.4 + } + }, { - "id": "mistral-7b-instruct-v0.1-awq", - "name": "@hf/thebloke/mistral-7b-instruct-v0.1-awq", - "display_name": "@hf/thebloke/mistral-7b-instruct-v0.1-awq", + "id": "grok-code-fast-1", + "name": "Grok Code Fast 1", + "display_name": "Grok Code Fast 1", "modalities": { "input": [ "text" @@ -38660,59 +36911,67 @@ ] }, "limit": { - "context": 4096, - "output": 4096 + "context": 256000, + "output": 10000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": true, - "release_date": "2023-09-27", - "last_updated": "2023-11-09", + "open_weights": false, + "knowledge": "2023-10", + "release_date": "2025-08-28", + "last_updated": "2025-08-28", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.2, + "output": 1.5, + "cache_read": 0.02 + } }, { - "id": "aura-1", - "name": "@cf/deepgram/aura-1", - "display_name": "@cf/deepgram/aura-1", + "id": "gpt-5.1-codex", + "name": "GPT-5.1 Codex", + "display_name": "GPT-5.1 Codex", "modalities": { "input": [ - "text" + "text", + "image", + "audio" ], "output": [ + "text", + "image", "audio" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 400000, + "output": 128000 }, "temperature": false, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": true, - "release_date": "2025-08-27", - "last_updated": "2025-07-07", + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-14", + "last_updated": "2025-11-14", "cost": { - "input": 0.015, - "output": 0.015 - }, - "type": "chat" + "input": 1.25, + "output": 10, + "cache_read": 0.125 + } }, { - "id": "mistral-7b-instruct-v0.2", - "name": "@hf/mistral/mistral-7b-instruct-v0.2", - "display_name": "@hf/mistral/mistral-7b-instruct-v0.2", + "id": "phi-3-mini-4k-instruct", + "name": "Phi-3-mini-instruct (4k)", + "display_name": "Phi-3-mini-instruct (4k)", "modalities": { "input": [ "text" @@ -38722,59 +36981,64 @@ ] }, "limit": { - "context": 3072, - "output": 4096 + "context": 4096, + "output": 1024 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2023-12-11", - "last_updated": "2025-07-24", + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.13, + "output": 0.52 + } }, { - "id": "tinyllama-1.1b-chat-v1.0", - "name": "@cf/tinyllama/tinyllama-1.1b-chat-v1.0", - "display_name": "@cf/tinyllama/tinyllama-1.1b-chat-v1.0", + "id": "claude-haiku-4-5", + "name": "Claude Haiku 4.5", + "display_name": "Claude Haiku 4.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 2048, - "output": 2048 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2023-12-30", - "last_updated": "2024-03-17", + "attachment": true, + "open_weights": false, + "knowledge": "2025-02-31", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 1, + "output": 5, + "cache_read": 0.1, + "cache_write": 1.25 + } }, { - "id": "qwen1.5-0.5b-chat", - "name": "@cf/qwen/qwen1.5-0.5b-chat", - "display_name": "@cf/qwen/qwen1.5-0.5b-chat", + "id": "deepseek-v3.2-speciale", + "name": "DeepSeek-V3.2-Speciale", + "display_name": "DeepSeek-V3.2-Speciale", "modalities": { "input": [ "text" @@ -38784,31 +37048,33 @@ ] }, "limit": { - "context": 32000, - "output": 32000 - }, + "context": 128000, + "output": 128000 + }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "release_date": "2024-01-31", - "last_updated": "2024-04-30", + "knowledge": "2024-07", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.58, + "output": 1.68 + } }, { - "id": "llama-3.2-11b-vision-instruct", - "name": "@cf/meta/llama-3.2-11b-vision-instruct", - "display_name": "@cf/meta/llama-3.2-11b-vision-instruct", + "id": "mistral-medium-2505", + "name": "Mistral Medium 3", + "display_name": "Mistral Medium 3", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -38823,51 +37089,56 @@ "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2024-09-18", - "last_updated": "2024-12-04", + "attachment": true, + "open_weights": false, + "knowledge": "2025-05", + "release_date": "2025-05-07", + "last_updated": "2025-05-07", "cost": { - "input": 0.049, - "output": 0.68 - }, - "type": "chat" + "input": 0.4, + "output": 2 + } }, { - "id": "llama-2-13b-chat-awq", - "name": "@hf/thebloke/llama-2-13b-chat-awq", - "display_name": "@hf/thebloke/llama-2-13b-chat-awq", + "id": "claude-opus-4-5", + "name": "Claude Opus 4.5", + "display_name": "Claude Opus 4.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 4096, - "output": 4096 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2023-09-19", - "last_updated": "2023-11-09", + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-11-24", + "last_updated": "2025-08-01", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 + } }, { - "id": "llama-3.1-8b-instruct-fp8", - "name": "@cf/meta/llama-3.1-8b-instruct-fp8", - "display_name": "@cf/meta/llama-3.1-8b-instruct-fp8", + "id": "phi-3-small-128k-instruct", + "name": "Phi-3-small-instruct (128k)", + "display_name": "Phi-3-small-instruct (128k)", "modalities": { "input": [ "text" @@ -38877,123 +37148,127 @@ ] }, "limit": { - "context": 32000, - "output": 32000 + "context": 128000, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2024-07-25", - "last_updated": "2024-07-25", + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", "cost": { "input": 0.15, - "output": 0.29 - }, - "type": "chat" + "output": 0.6 + } }, { - "id": "whisper", - "name": "@cf/openai/whisper", - "display_name": "@cf/openai/whisper", + "id": "cohere-command-a", + "name": "Command A", + "display_name": "Command A", "modalities": { "input": [ - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 256000, + "output": 8000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "release_date": "2023-11-07", - "last_updated": "2024-08-12", + "knowledge": "2024-06-01", + "release_date": "2025-03-13", + "last_updated": "2025-03-13", "cost": { - "input": 0.00045, - "output": 0.00045 - }, - "type": "chat" + "input": 2.5, + "output": 10 + } }, { - "id": "stable-diffusion-xl-base-1.0", - "name": "@cf/stabilityai/stable-diffusion-xl-base-1.0", - "display_name": "@cf/stabilityai/stable-diffusion-xl-base-1.0", + "id": "cohere-command-r-plus-08-2024", + "name": "Command R+", + "display_name": "Command R+", "modalities": { "input": [ "text" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 128000, + "output": 4000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "release_date": "2023-07-25", - "last_updated": "2023-10-30", + "knowledge": "2024-06-01", + "release_date": "2024-08-30", + "last_updated": "2024-08-30", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 2.5, + "output": 10 + } }, { - "id": "llama-2-7b-chat-fp16", - "name": "@cf/meta/llama-2-7b-chat-fp16", - "display_name": "@cf/meta/llama-2-7b-chat-fp16", + "id": "llama-4-maverick-17b-128e-instruct-fp8", + "name": "Llama 4 Maverick 17B 128E Instruct FP8", + "display_name": "Llama 4 Maverick 17B 128E Instruct FP8", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 4096, - "output": 4096 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2023-07-26", - "last_updated": "2023-07-26", + "knowledge": "2024-08", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", "cost": { - "input": 0.56, - "output": 6.67 - }, - "type": "chat" + "input": 0.25, + "output": 1 + } }, { - "id": "resnet-50", - "name": "@cf/microsoft/resnet-50", - "display_name": "@cf/microsoft/resnet-50", + "id": "gpt-4.1-mini", + "name": "GPT-4.1 mini", + "display_name": "GPT-4.1 mini", "modalities": { "input": [ + "text", "image" ], "output": [ @@ -39001,59 +37276,63 @@ ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 1047576, + "output": 32768 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2022-03-16", - "last_updated": "2024-02-13", + "attachment": true, + "open_weights": false, + "knowledge": "2024-05", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.0000025, - "output": 0 - }, - "type": "chat" + "input": 0.4, + "output": 1.6, + "cache_read": 0.1 + } }, { - "id": "stable-diffusion-v1-5-inpainting", - "name": "@cf/runwayml/stable-diffusion-v1-5-inpainting", - "display_name": "@cf/runwayml/stable-diffusion-v1-5-inpainting", + "id": "gpt-5-chat", + "name": "GPT-5 Chat", + "display_name": "GPT-5 Chat", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 128000, + "output": 16384 }, "temperature": false, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2024-02-27", - "last_updated": "2024-02-27", + "attachment": true, + "open_weights": false, + "knowledge": "2024-10-24", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 1.25, + "output": 10, + "cache_read": 0.13 + } }, { - "id": "sqlcoder-7b-2", - "name": "@cf/defog/sqlcoder-7b-2", - "display_name": "@cf/defog/sqlcoder-7b-2", + "id": "deepseek-v3.1", + "name": "DeepSeek-V3.1", + "display_name": "DeepSeek-V3.1", "modalities": { "input": [ "text" @@ -39063,28 +37342,29 @@ ] }, "limit": { - "context": 10000, - "output": 10000 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "release_date": "2024-02-05", - "last_updated": "2024-02-12", + "knowledge": "2024-07", + "release_date": "2025-08-21", + "last_updated": "2025-08-21", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.56, + "output": 1.68 + } }, { - "id": "llama-3-8b-instruct", - "name": "@cf/meta/llama-3-8b-instruct", - "display_name": "@cf/meta/llama-3-8b-instruct", + "id": "phi-4", + "name": "Phi-4", + "display_name": "Phi-4", "modalities": { "input": [ "text" @@ -39094,28 +37374,28 @@ ] }, "limit": { - "context": 7968, - "output": 7968 + "context": 128000, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2024-04-17", - "last_updated": "2025-06-19", + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 0.28, - "output": 0.83 - }, - "type": "chat" + "input": 0.125, + "output": 0.5 + } }, { - "id": "llama-2-7b-chat-hf-lora", - "name": "@cf/meta-llama/llama-2-7b-chat-hf-lora", - "display_name": "@cf/meta-llama/llama-2-7b-chat-hf-lora", + "id": "phi-4-mini-reasoning", + "name": "Phi-4-mini-reasoning", + "display_name": "Phi-4-mini-reasoning", "modalities": { "input": [ "text" @@ -39125,59 +37405,65 @@ ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "release_date": "2023-07-13", - "last_updated": "2024-04-17", + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.075, + "output": 0.3 + } }, { - "id": "llama-3.1-8b-instruct", - "name": "@cf/meta/llama-3.1-8b-instruct", - "display_name": "@cf/meta/llama-3.1-8b-instruct", + "id": "claude-sonnet-4-5", + "name": "Claude Sonnet 4.5", + "display_name": "Claude Sonnet 4.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 7968, - "output": 7968 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2024-07-18", - "last_updated": "2024-09-25", + "attachment": true, + "open_weights": false, + "knowledge": "2025-07-31", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", "cost": { - "input": 0.28, - "output": 0.83 - }, - "type": "chat" + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 + } }, { - "id": "openchat-3.5-0106", - "name": "@cf/openchat/openchat-3.5-0106", - "display_name": "@cf/openchat/openchat-3.5-0106", + "id": "gpt-3.5-turbo-0125", + "name": "GPT-3.5 Turbo 0125", + "display_name": "GPT-3.5 Turbo 0125", "modalities": { "input": [ "text" @@ -39187,28 +37473,28 @@ ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 16384, + "output": 16384 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2024-01-07", - "last_updated": "2024-05-18", + "open_weights": false, + "knowledge": "2021-08", + "release_date": "2024-01-25", + "last_updated": "2024-01-25", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.5, + "output": 1.5 + } }, { - "id": "openhermes-2.5-mistral-7b-awq", - "name": "@hf/thebloke/openhermes-2.5-mistral-7b-awq", - "display_name": "@hf/thebloke/openhermes-2.5-mistral-7b-awq", + "id": "grok-3", + "name": "Grok 3", + "display_name": "Grok 3", "modalities": { "input": [ "text" @@ -39218,8 +37504,8 @@ ] }, "limit": { - "context": 4096, - "output": 4096 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -39227,50 +37513,49 @@ "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2023-11-02", - "last_updated": "2023-11-09", + "open_weights": false, + "knowledge": "2024-11", + "release_date": "2025-02-17", + "last_updated": "2025-02-17", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 3, + "output": 15, + "cache_read": 0.75 + } }, { - "id": "lucid-origin", - "name": "@cf/leonardo/lucid-origin", - "display_name": "@cf/leonardo/lucid-origin", + "id": "text-embedding-3-large", + "name": "text-embedding-3-large", + "display_name": "text-embedding-3-large", "modalities": { "input": [ "text" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 8191, + "output": 3072 }, - "temperature": false, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-08-25", - "last_updated": "2025-08-05", + "release_date": "2024-01-25", + "last_updated": "2024-01-25", "cost": { - "input": 0.007, - "output": 0.007 - }, - "type": "chat" + "input": 0.13, + "output": 0 + } }, { - "id": "bart-large-cnn", - "name": "@cf/facebook/bart-large-cnn", - "display_name": "@cf/facebook/bart-large-cnn", + "id": "meta-llama-3-70b-instruct", + "name": "Meta-Llama-3-70B-Instruct", + "display_name": "Meta-Llama-3-70B-Instruct", "modalities": { "input": [ "text" @@ -39281,58 +37566,58 @@ }, "limit": { "context": 8192, - "output": 8192 + "output": 2048 }, - "temperature": false, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2022-03-02", - "last_updated": "2024-02-13", + "knowledge": "2023-12", + "release_date": "2024-04-18", + "last_updated": "2024-04-18", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 2.68, + "output": 3.54 + } }, { - "id": "flux-1-schnell", - "name": "@cf/black-forest-labs/flux-1-schnell", - "display_name": "@cf/black-forest-labs/flux-1-schnell", + "id": "deepseek-v3-0324", + "name": "DeepSeek-V3-0324", + "display_name": "DeepSeek-V3-0324", "modalities": { "input": [ "text" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 2048, - "output": 8192 + "context": 131072, + "output": 131072 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2024-07-31", - "last_updated": "2024-08-16", + "knowledge": "2024-07", + "release_date": "2025-03-24", + "last_updated": "2025-03-24", "cost": { - "input": 0.000053, - "output": 0.00011 - }, - "type": "chat" + "input": 1.14, + "output": 4.56 + } }, { - "id": "deepseek-r1-distill-qwen-32b", - "name": "@cf/deepseek-ai/deepseek-r1-distill-qwen-32b", - "display_name": "@cf/deepseek-ai/deepseek-r1-distill-qwen-32b", + "id": "phi-3-small-8k-instruct", + "name": "Phi-3-small-instruct (8k)", + "display_name": "Phi-3-small-instruct (8k)", "modalities": { "input": [ "text" @@ -39342,29 +37627,28 @@ ] }, "limit": { - "context": 80000, - "output": 80000 + "context": 8192, + "output": 2048 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-01-20", - "last_updated": "2025-02-24", + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", "cost": { - "input": 0.5, - "output": 4.88 - }, - "type": "chat" + "input": 0.15, + "output": 0.6 + } }, { - "id": "gemma-2b-it-lora", - "name": "@cf/google/gemma-2b-it-lora", - "display_name": "@cf/google/gemma-2b-it-lora", + "id": "meta-llama-3.1-70b-instruct", + "name": "Meta-Llama-3.1-70B-Instruct", + "display_name": "Meta-Llama-3.1-70B-Instruct", "modalities": { "input": [ "text" @@ -39374,8 +37658,8 @@ ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -39384,49 +37668,50 @@ }, "attachment": false, "open_weights": true, - "release_date": "2024-04-02", - "last_updated": "2024-04-02", + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 2.68, + "output": 3.54 + } }, { - "id": "una-cybertron-7b-v2-bf16", - "name": "@cf/fblgit/una-cybertron-7b-v2-bf16", - "display_name": "@cf/fblgit/una-cybertron-7b-v2-bf16", + "id": "gpt-4-turbo", + "name": "GPT-4 Turbo", + "display_name": "GPT-4 Turbo", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 15000, - "output": 15000 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2023-12-02", - "last_updated": "2024-03-08", + "attachment": true, + "open_weights": false, + "knowledge": "2023-11", + "release_date": "2023-11-06", + "last_updated": "2024-04-09", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 10, + "output": 30 + } }, { - "id": "gemma-sea-lion-v4-27b-it", - "name": "@cf/aisingapore/gemma-sea-lion-v4-27b-it", - "display_name": "@cf/aisingapore/gemma-sea-lion-v4-27b-it", + "id": "gpt-3.5-turbo-0613", + "name": "GPT-3.5 Turbo 0613", + "display_name": "GPT-3.5 Turbo 0613", "modalities": { "input": [ "text" @@ -39436,28 +37721,28 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 16384, + "output": 16384 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-09-23", - "last_updated": "2025-12-02", + "knowledge": "2021-08", + "release_date": "2023-06-13", + "last_updated": "2023-06-13", "cost": { - "input": 0.35, - "output": 0.56 - }, - "type": "chat" + "input": 3, + "output": 4 + } }, { - "id": "m2m100-1.2b", - "name": "@cf/meta/m2m100-1.2b", - "display_name": "@cf/meta/m2m100-1.2b", + "id": "phi-3.5-mini-instruct", + "name": "Phi-3.5-mini-instruct", + "display_name": "Phi-3.5-mini-instruct", "modalities": { "input": [ "text" @@ -39467,28 +37752,28 @@ ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 128000, + "output": 4096 }, - "temperature": false, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2022-03-02", - "last_updated": "2023-11-16", + "knowledge": "2023-10", + "release_date": "2024-08-20", + "last_updated": "2024-08-20", "cost": { - "input": 0.34, - "output": 0.34 - }, - "type": "chat" + "input": 0.13, + "output": 0.52 + } }, { - "id": "llama-3.2-3b-instruct", - "name": "@cf/meta/llama-3.2-3b-instruct", - "display_name": "@cf/meta/llama-3.2-3b-instruct", + "id": "o1-preview", + "name": "o1-preview", + "display_name": "o1-preview", "modalities": { "input": [ "text" @@ -39499,27 +37784,29 @@ }, "limit": { "context": 128000, - "output": 128000 + "output": 32768 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": true, - "release_date": "2024-09-18", - "last_updated": "2024-10-24", + "open_weights": false, + "knowledge": "2023-09", + "release_date": "2024-09-12", + "last_updated": "2024-09-12", "cost": { - "input": 0.051, - "output": 0.34 - }, - "type": "chat" + "input": 16.5, + "output": 66, + "cache_read": 8.25 + } }, { - "id": "qwen2.5-coder-32b-instruct", - "name": "@cf/qwen/qwen2.5-coder-32b-instruct", - "display_name": "@cf/qwen/qwen2.5-coder-32b-instruct", + "id": "llama-3.3-70b-instruct", + "name": "Llama-3.3-70B-Instruct", + "display_name": "Llama-3.3-70B-Instruct", "modalities": { "input": [ "text" @@ -39529,7 +37816,7 @@ ] }, "limit": { - "context": 32768, + "context": 128000, "output": 32768 }, "temperature": true, @@ -39539,49 +37826,52 @@ }, "attachment": false, "open_weights": true, - "release_date": "2024-11-06", - "last_updated": "2025-01-12", + "knowledge": "2023-12", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 0.66, - "output": 1 - }, - "type": "chat" + "input": 0.71, + "output": 0.71 + } }, { - "id": "stable-diffusion-v1-5-img2img", - "name": "@cf/runwayml/stable-diffusion-v1-5-img2img", - "display_name": "@cf/runwayml/stable-diffusion-v1-5-img2img", + "id": "gpt-5.1-codex-mini", + "name": "GPT-5.1 Codex Mini", + "display_name": "GPT-5.1 Codex Mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 400000, + "output": 128000 }, "temperature": false, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": true, - "release_date": "2024-02-27", - "last_updated": "2024-02-27", + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-14", + "last_updated": "2025-11-14", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.25, + "output": 2, + "cache_read": 0.025 + } }, { - "id": "gemma-7b-it-lora", - "name": "@cf/google/gemma-7b-it-lora", - "display_name": "@cf/google/gemma-7b-it-lora", + "id": "kimi-k2-thinking", + "name": "Kimi K2 Thinking", + "display_name": "Kimi K2 Thinking", "modalities": { "input": [ "text" @@ -39591,59 +37881,60 @@ ] }, "limit": { - "context": 3500, - "output": 3500 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "release_date": "2024-04-02", - "last_updated": "2024-04-02", + "knowledge": "2024-08", + "release_date": "2025-11-06", + "last_updated": "2025-12-02", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.6, + "output": 2.5, + "cache_read": 0.15 + } }, { - "id": "qwen1.5-14b-chat-awq", - "name": "@cf/qwen/qwen1.5-14b-chat-awq", - "display_name": "@cf/qwen/qwen1.5-14b-chat-awq", + "id": "model-router", + "name": "Model Router", + "display_name": "Model Router", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 7500, - "output": 7500 + "context": 128000, + "output": 16384 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2024-02-03", - "last_updated": "2024-04-30", + "attachment": true, + "open_weights": false, + "release_date": "2025-05-19", + "last_updated": "2025-11-18", "cost": { - "input": 0, + "input": 0.14, "output": 0 - }, - "type": "chat" + } }, { - "id": "qwen1.5-1.8b-chat", - "name": "@cf/qwen/qwen1.5-1.8b-chat", - "display_name": "@cf/qwen/qwen1.5-1.8b-chat", + "id": "o3-mini", + "name": "o3-mini", + "display_name": "o3-mini", "modalities": { "input": [ "text" @@ -39653,153 +37944,167 @@ ] }, "limit": { - "context": 32000, - "output": 32000 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": true, - "release_date": "2024-01-30", - "last_updated": "2024-04-30", + "open_weights": false, + "knowledge": "2024-05", + "release_date": "2024-12-20", + "last_updated": "2025-01-29", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 1.1, + "output": 4.4, + "cache_read": 0.55 + } }, { - "id": "mistral-small-3.1-24b-instruct", - "name": "@cf/mistralai/mistral-small-3.1-24b-instruct", - "display_name": "@cf/mistralai/mistral-small-3.1-24b-instruct", + "id": "gpt-5.1", + "name": "GPT-5.1", + "display_name": "GPT-5.1", "modalities": { "input": [ - "text" + "text", + "image", + "audio" ], "output": [ - "text" + "text", + "image", + "audio" ] }, "limit": { - "context": 128000, + "context": 272000, "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-03-11", - "last_updated": "2025-07-28", + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-14", + "last_updated": "2025-11-14", "cost": { - "input": 0.35, - "output": 0.56 - }, - "type": "chat" + "input": 1.25, + "output": 10, + "cache_read": 0.125 + } }, { - "id": "gemma-7b-it", - "name": "@hf/google/gemma-7b-it", - "display_name": "@hf/google/gemma-7b-it", + "id": "gpt-5-nano", + "name": "GPT-5 Nano", + "display_name": "GPT-5 Nano", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 272000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2024-02-13", - "last_updated": "2024-08-14", + "attachment": true, + "open_weights": false, + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.05, + "output": 0.4, + "cache_read": 0.01 + } }, { - "id": "qwen3-30b-a3b-fp8", - "name": "@cf/qwen/qwen3-30b-a3b-fp8", - "display_name": "@cf/qwen/qwen3-30b-a3b-fp8", + "id": "gpt-5-codex", + "name": "GPT-5-Codex", + "display_name": "GPT-5-Codex", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 8192 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, "attachment": false, - "open_weights": true, - "release_date": "2025-04-30", - "last_updated": "2025-12-02", + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-09-15", + "last_updated": "2025-09-15", "cost": { - "input": 0.051, - "output": 0.34 - }, - "type": "chat" + "input": 1.25, + "output": 10, + "cache_read": 0.13 + } }, { - "id": "llamaguard-7b-awq", - "name": "@hf/thebloke/llamaguard-7b-awq", - "display_name": "@hf/thebloke/llamaguard-7b-awq", + "id": "llama-3.2-90b-vision-instruct", + "name": "Llama-3.2-90B-Vision-Instruct", + "display_name": "Llama-3.2-90B-Vision-Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 4096, - "output": 4096 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2023-12-11", - "last_updated": "2023-12-11", + "knowledge": "2023-12", + "release_date": "2024-09-25", + "last_updated": "2024-09-25", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 2.04, + "output": 2.04 + } }, { - "id": "hermes-2-pro-mistral-7b", - "name": "@hf/nousresearch/hermes-2-pro-mistral-7b", - "display_name": "@hf/nousresearch/hermes-2-pro-mistral-7b", + "id": "phi-3-mini-128k-instruct", + "name": "Phi-3-mini-instruct (128k)", + "display_name": "Phi-3-mini-instruct (128k)", "modalities": { "input": [ "text" @@ -39809,59 +38114,61 @@ ] }, "limit": { - "context": 24000, - "output": 24000 + "context": 128000, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2024-03-11", - "last_updated": "2024-09-08", + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.13, + "output": 0.52 + } }, { - "id": "granite-4.0-h-micro", - "name": "@cf/ibm-granite/granite-4.0-h-micro", - "display_name": "@cf/ibm-granite/granite-4.0-h-micro", + "id": "gpt-4o", + "name": "GPT-4o", + "display_name": "GPT-4o", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131000, - "output": 8192 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-10-07", - "last_updated": "2025-12-02", + "knowledge": "2023-09", + "release_date": "2024-05-13", + "last_updated": "2024-05-13", "cost": { - "input": 0.017, - "output": 0.11 - }, - "type": "chat" + "input": 2.5, + "output": 10, + "cache_read": 1.25 + } }, { - "id": "falcon-7b-instruct", - "name": "@cf/tiiuae/falcon-7b-instruct", - "display_name": "@cf/tiiuae/falcon-7b-instruct", + "id": "gpt-3.5-turbo-0301", + "name": "GPT-3.5 Turbo 0301", + "display_name": "GPT-3.5 Turbo 0301", "modalities": { "input": [ "text" @@ -39875,24 +38182,24 @@ "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2023-04-25", - "last_updated": "2024-10-12", + "open_weights": false, + "knowledge": "2021-08", + "release_date": "2023-03-01", + "last_updated": "2023-03-01", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 1.5, + "output": 2 + } }, { - "id": "llama-3.3-70b-instruct-fp8-fast", - "name": "@cf/meta/llama-3.3-70b-instruct-fp8-fast", - "display_name": "@cf/meta/llama-3.3-70b-instruct-fp8-fast", + "id": "ministral-3b", + "name": "Ministral 3B", + "display_name": "Ministral 3B", "modalities": { "input": [ "text" @@ -39902,8 +38209,8 @@ ] }, "limit": { - "context": 24000, - "output": 24000 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -39912,173 +38219,184 @@ }, "attachment": false, "open_weights": true, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "knowledge": "2024-03", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", "cost": { - "input": 0.29, - "output": 2.25 - }, - "type": "chat" + "input": 0.04, + "output": 0.04 + } }, { - "id": "llama-3-8b-instruct-awq", - "name": "@cf/meta/llama-3-8b-instruct-awq", - "display_name": "@cf/meta/llama-3-8b-instruct-awq", + "id": "gpt-4.1", + "name": "GPT-4.1", + "display_name": "GPT-4.1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 1047576, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2024-05-09", - "last_updated": "2024-05-09", + "attachment": true, + "open_weights": false, + "knowledge": "2024-05", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.12, - "output": 0.27 - }, - "type": "chat" + "input": 2, + "output": 8, + "cache_read": 0.5 + } }, { - "id": "phoenix-1.0", - "name": "@cf/leonardo/phoenix-1.0", - "display_name": "@cf/leonardo/phoenix-1.0", + "id": "o4-mini", + "name": "o4-mini", + "display_name": "o4-mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 200000, + "output": 100000 }, "temperature": false, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-08-25", - "last_updated": "2025-08-25", + "knowledge": "2024-05", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "cost": { - "input": 0.0058, - "output": 0.0058 - }, - "type": "chat" + "input": 1.1, + "output": 4.4, + "cache_read": 0.28 + } }, { - "id": "phi-2", - "name": "@cf/microsoft/phi-2", - "display_name": "@cf/microsoft/phi-2", + "id": "phi-4-multimodal", + "name": "Phi-4-multimodal", + "display_name": "Phi-4-multimodal", "modalities": { "input": [ - "text" + "text", + "image", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 2048, - "output": 2048 + "context": 128000, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2023-12-13", - "last_updated": "2024-04-29", + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.08, + "output": 0.32, + "input_audio": 4 + } }, { - "id": "dreamshaper-8-lcm", - "name": "@cf/lykon/dreamshaper-8-lcm", - "display_name": "@cf/lykon/dreamshaper-8-lcm", + "id": "meta-llama-3-8b-instruct", + "name": "Meta-Llama-3-8B-Instruct", + "display_name": "Meta-Llama-3-8B-Instruct", "modalities": { "input": [ "text" ], "output": [ - "image" + "text" ] }, "limit": { "context": 8192, - "output": 8192 + "output": 2048 }, - "temperature": false, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2023-12-06", - "last_updated": "2023-12-07", + "knowledge": "2023-12", + "release_date": "2024-04-18", + "last_updated": "2024-04-18", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.3, + "output": 0.61 + } }, { - "id": "discolm-german-7b-v1-awq", - "name": "@cf/thebloke/discolm-german-7b-v1-awq", - "display_name": "@cf/thebloke/discolm-german-7b-v1-awq", + "id": "o1", + "name": "o1", + "display_name": "o1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 4096, - "output": 4096 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": true, - "release_date": "2024-01-18", - "last_updated": "2024-01-24", + "open_weights": false, + "knowledge": "2023-09", + "release_date": "2024-12-05", + "last_updated": "2024-12-05", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 15, + "output": 60, + "cache_read": 7.5 + } }, { - "id": "llama-2-7b-chat-int8", - "name": "@cf/meta/llama-2-7b-chat-int8", - "display_name": "@cf/meta/llama-2-7b-chat-int8", + "id": "grok-3-mini", + "name": "Grok 3 Mini", + "display_name": "Grok 3 Mini", "modalities": { "input": [ "text" @@ -40088,121 +38406,133 @@ ] }, "limit": { - "context": 8192, + "context": 131072, "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": true, - "release_date": "2023-09-25", - "last_updated": "2023-09-25", + "open_weights": false, + "knowledge": "2024-11", + "release_date": "2025-02-17", + "last_updated": "2025-02-17", "cost": { - "input": 0.556, - "output": 6.667 - }, - "type": "chat" + "input": 0.3, + "output": 0.5, + "reasoning": 0.5, + "cache_read": 0.075 + } }, { - "id": "llama-3.2-1b-instruct", - "name": "@cf/meta/llama-3.2-1b-instruct", - "display_name": "@cf/meta/llama-3.2-1b-instruct", + "id": "gpt-5.1-chat", + "name": "GPT-5.1 Chat", + "display_name": "GPT-5.1 Chat", "modalities": { "input": [ - "text" + "text", + "image", + "audio" ], "output": [ - "text" + "text", + "image", + "audio" ] }, "limit": { - "context": 60000, - "output": 60000 + "context": 128000, + "output": 16384 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2024-09-18", - "last_updated": "2024-10-24", + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-14", + "last_updated": "2025-11-14", "cost": { - "input": 0.027, - "output": 0.2 - }, - "type": "chat" - }, + "input": 1.25, + "output": 10, + "cache_read": 0.125 + } + }, { - "id": "whisper-large-v3-turbo", - "name": "@cf/openai/whisper-large-v3-turbo", - "display_name": "@cf/openai/whisper-large-v3-turbo", + "id": "phi-3.5-moe-instruct", + "name": "Phi-3.5-MoE-instruct", + "display_name": "Phi-3.5-MoE-instruct", "modalities": { "input": [ - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 128000, + "output": 4096 }, - "temperature": false, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2024-10-01", - "last_updated": "2024-10-04", + "knowledge": "2023-10", + "release_date": "2024-08-20", + "last_updated": "2024-08-20", "cost": { - "input": 0.00051, - "output": 0.00051 - }, - "type": "chat" + "input": 0.16, + "output": 0.64 + } }, { - "id": "llama-4-scout-17b-16e-instruct", - "name": "@cf/meta/llama-4-scout-17b-16e-instruct", - "display_name": "@cf/meta/llama-4-scout-17b-16e-instruct", + "id": "gpt-5-mini", + "name": "GPT-5 Mini", + "display_name": "GPT-5 Mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 272000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-04-02", - "last_updated": "2025-05-23", + "attachment": true, + "open_weights": false, + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.27, - "output": 0.85 - }, - "type": "chat" + "input": 0.25, + "output": 2, + "cache_read": 0.03 + } }, { - "id": "starling-lm-7b-beta", - "name": "@hf/nexusflow/starling-lm-7b-beta", - "display_name": "@hf/nexusflow/starling-lm-7b-beta", + "id": "o1-mini", + "name": "o1-mini", + "display_name": "o1-mini", "modalities": { "input": [ "text" @@ -40212,59 +38542,62 @@ ] }, "limit": { - "context": 4096, - "output": 4096 + "context": 128000, + "output": 65536 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": true, - "release_date": "2024-03-19", - "last_updated": "2024-04-03", + "open_weights": false, + "knowledge": "2023-09", + "release_date": "2024-09-12", + "last_updated": "2024-09-12", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 1.1, + "output": 4.4, + "cache_read": 0.55 + } }, { - "id": "deepseek-coder-6.7b-base-awq", - "name": "@hf/thebloke/deepseek-coder-6.7b-base-awq", - "display_name": "@hf/thebloke/deepseek-coder-6.7b-base-awq", + "id": "llama-4-scout-17b-16e-instruct", + "name": "Llama 4 Scout 17B 16E Instruct", + "display_name": "Llama 4 Scout 17B 16E Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 4096, - "output": 4096 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2023-11-05", - "last_updated": "2023-11-09", + "knowledge": "2024-08", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.2, + "output": 0.78 + } }, { - "id": "gemma-3-12b-it", - "name": "@cf/google/gemma-3-12b-it", - "display_name": "@cf/google/gemma-3-12b-it", + "id": "cohere-embed-v3-english", + "name": "Embed v3 English", + "display_name": "Embed v3 English", "modalities": { "input": [ "text" @@ -40274,28 +38607,27 @@ ] }, "limit": { - "context": 80000, - "output": 80000 + "context": 512, + "output": 1024 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-03-01", - "last_updated": "2025-03-21", + "release_date": "2023-11-07", + "last_updated": "2023-11-07", "cost": { - "input": 0.35, - "output": 0.56 - }, - "type": "chat" + "input": 0.1, + "output": 0 + } }, { - "id": "llama-guard-3-8b", - "name": "@cf/meta/llama-guard-3-8b", - "display_name": "@cf/meta/llama-guard-3-8b", + "id": "text-embedding-ada-002", + "name": "text-embedding-ada-002", + "display_name": "text-embedding-ada-002", "modalities": { "input": [ "text" @@ -40305,28 +38637,26 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 8192, + "output": 1536 }, - "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2024-07-22", - "last_updated": "2024-10-11", + "open_weights": false, + "release_date": "2022-12-15", + "last_updated": "2022-12-15", "cost": { - "input": 0.48, - "output": 0.03 - }, - "type": "chat" + "input": 0.1, + "output": 0 + } }, { - "id": "neural-chat-7b-v3-1-awq", - "name": "@hf/thebloke/neural-chat-7b-v3-1-awq", - "display_name": "@hf/thebloke/neural-chat-7b-v3-1-awq", + "id": "meta-llama-3.1-8b-instruct", + "name": "Meta-Llama-3.1-8B-Instruct", + "display_name": "Meta-Llama-3.1-8B-Instruct", "modalities": { "input": [ "text" @@ -40336,8 +38666,8 @@ ] }, "limit": { - "context": 4096, - "output": 4096 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -40346,80 +38676,83 @@ }, "attachment": false, "open_weights": true, - "release_date": "2023-11-15", - "last_updated": "2023-11-17", + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.3, + "output": 0.61 + } }, { - "id": "whisper-tiny-en", - "name": "@cf/openai/whisper-tiny-en", - "display_name": "@cf/openai/whisper-tiny-en", + "id": "gpt-5.1-codex-max", + "name": "GPT-5.1 Codex Max", + "display_name": "GPT-5.1 Codex Max", "modalities": { "input": [ - "audio" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 400000, + "output": 128000 }, "temperature": false, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2022-09-26", - "last_updated": "2024-01-22", + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 1.25, + "output": 10, + "cache_read": 0.125 + } }, { - "id": "stable-diffusion-xl-lightning", - "name": "@cf/bytedance/stable-diffusion-xl-lightning", - "display_name": "@cf/bytedance/stable-diffusion-xl-lightning", + "id": "gpt-3.5-turbo-instruct", + "name": "GPT-3.5 Turbo Instruct", + "display_name": "GPT-3.5 Turbo Instruct", "modalities": { "input": [ "text" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 4096, + "output": 4096 }, - "temperature": false, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2024-02-20", - "last_updated": "2024-04-03", + "open_weights": false, + "knowledge": "2021-08", + "release_date": "2023-09-21", + "last_updated": "2023-09-21", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 1.5, + "output": 2 + } }, { - "id": "mistral-7b-instruct-v0.1", - "name": "@cf/mistral/mistral-7b-instruct-v0.1", - "display_name": "@cf/mistral/mistral-7b-instruct-v0.1", + "id": "mistral-nemo", + "name": "Mistral Nemo", + "display_name": "Mistral Nemo", "modalities": { "input": [ "text" @@ -40429,8 +38762,8 @@ ] }, "limit": { - "context": 2824, - "output": 2824 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -40439,50 +38772,52 @@ }, "attachment": false, "open_weights": true, - "release_date": "2023-09-27", - "last_updated": "2025-07-24", + "knowledge": "2024-07", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", "cost": { - "input": 0.11, - "output": 0.19 - }, - "type": "chat" + "input": 0.15, + "output": 0.15 + } }, { - "id": "llava-1.5-7b-hf", - "name": "@cf/llava-hf/llava-1.5-7b-hf", - "display_name": "@cf/llava-hf/llava-1.5-7b-hf", + "id": "o3", + "name": "o3", + "display_name": "o3", "modalities": { "input": [ - "image", - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 200000, + "output": 100000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, - "open_weights": true, - "release_date": "2023-12-05", - "last_updated": "2025-06-06", + "open_weights": false, + "knowledge": "2024-05", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 2, + "output": 8, + "cache_read": 0.5 + } }, { - "id": "gpt-oss-20b", - "name": "@cf/openai/gpt-oss-20b", - "display_name": "@cf/openai/gpt-oss-20b", + "id": "codex-mini", + "name": "Codex Mini", + "display_name": "Codex Mini", "modalities": { "input": [ "text" @@ -40492,29 +38827,30 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 200000, + "output": 100000 }, "temperature": false, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-08-04", - "last_updated": "2025-08-14", + "attachment": true, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-05-16", + "last_updated": "2025-05-16", "cost": { - "input": 0.2, - "output": 0.3 - }, - "type": "chat" + "input": 1.5, + "output": 6, + "cache_read": 0.375 + } }, { - "id": "deepseek-math-7b-instruct", - "name": "@cf/deepseek-ai/deepseek-math-7b-instruct", - "display_name": "@cf/deepseek-ai/deepseek-math-7b-instruct", + "id": "phi-3-medium-4k-instruct", + "name": "Phi-3-medium-instruct (4k)", + "display_name": "Phi-3-medium-instruct (4k)", "modalities": { "input": [ "text" @@ -40525,27 +38861,27 @@ }, "limit": { "context": 4096, - "output": 4096 + "output": 1024 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2024-02-05", - "last_updated": "2024-02-06", + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.17, + "output": 0.68 + } }, { - "id": "gpt-oss-120b", - "name": "@cf/openai/gpt-oss-120b", - "display_name": "@cf/openai/gpt-oss-120b", + "id": "phi-4-reasoning", + "name": "Phi-4-reasoning", + "display_name": "Phi-4-reasoning", "modalities": { "input": [ "text" @@ -40555,10 +38891,10 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 32000, + "output": 4096 }, - "temperature": false, + "temperature": true, "tool_call": false, "reasoning": { "supported": true, @@ -40566,49 +38902,50 @@ }, "attachment": false, "open_weights": true, - "release_date": "2025-08-04", - "last_updated": "2025-08-14", + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 0.35, - "output": 0.75 - }, - "type": "chat" + "input": 0.125, + "output": 0.5 + } }, { - "id": "melotts", - "name": "@cf/myshell-ai/melotts", - "display_name": "@cf/myshell-ai/melotts", + "id": "gpt-4-turbo-vision", + "name": "GPT-4 Turbo Vision", + "display_name": "GPT-4 Turbo Vision", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "audio" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 128000, + "output": 4096 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": true, - "open_weights": true, - "release_date": "2024-07-19", - "last_updated": "2024-07-19", + "open_weights": false, + "knowledge": "2023-11", + "release_date": "2023-11-06", + "last_updated": "2024-04-09", "cost": { - "input": 0.0002, - "output": 0 - }, - "type": "chat" + "input": 10, + "output": 30 + } }, { - "id": "qwen1.5-7b-chat-awq", - "name": "@cf/qwen/qwen1.5-7b-chat-awq", - "display_name": "@cf/qwen/qwen1.5-7b-chat-awq", + "id": "phi-4-reasoning-plus", + "name": "Phi-4-reasoning-plus", + "display_name": "Phi-4-reasoning-plus", "modalities": { "input": [ "text" @@ -40618,31 +38955,33 @@ ] }, "limit": { - "context": 20000, - "output": 20000 + "context": 32000, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "release_date": "2024-02-03", - "last_updated": "2024-04-30", + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.125, + "output": 0.5 + } }, { - "id": "llama-3.1-8b-instruct-fast", - "name": "@cf/meta/llama-3.1-8b-instruct-fast", - "display_name": "@cf/meta/llama-3.1-8b-instruct-fast", + "id": "gpt-4o-mini", + "name": "GPT-4o mini", + "display_name": "GPT-4o mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -40650,58 +38989,62 @@ }, "limit": { "context": 128000, - "output": 128000 + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, + "attachment": true, + "open_weights": false, + "knowledge": "2023-09", "release_date": "2024-07-18", - "last_updated": "2024-09-25", + "last_updated": "2024-07-18", "cost": { - "input": 0.045, - "output": 0.384 - }, - "type": "chat" + "input": 0.15, + "output": 0.6, + "cache_read": 0.08 + } }, { - "id": "nova-3", - "name": "@cf/deepgram/nova-3", - "display_name": "@cf/deepgram/nova-3", + "id": "gpt-5", + "name": "GPT-5", + "display_name": "GPT-5", "modalities": { "input": [ - "audio" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 272000, + "output": 128000 }, "temperature": false, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-06-05", - "last_updated": "2025-07-08", + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.0052, - "output": 0.0052 - }, - "type": "chat" + "input": 1.25, + "output": 10, + "cache_read": 0.13 + } }, { - "id": "llama-3.1-70b-instruct", - "name": "@cf/meta/llama-3.1-70b-instruct", - "display_name": "@cf/meta/llama-3.1-70b-instruct", + "id": "mai-ds-r1", + "name": "MAI-DS-R1", + "display_name": "MAI-DS-R1", "modalities": { "input": [ "text" @@ -40711,28 +39054,29 @@ ] }, "limit": { - "context": 24000, - "output": 24000 + "context": 128000, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": true, - "release_date": "2024-07-16", - "last_updated": "2024-12-15", + "open_weights": false, + "knowledge": "2024-06", + "release_date": "2025-01-20", + "last_updated": "2025-01-20", "cost": { - "input": 0.293, - "output": 2.253 - }, - "type": "chat" + "input": 1.35, + "output": 5.4 + } }, { - "id": "qwq-32b", - "name": "@cf/qwen/qwq-32b", - "display_name": "@cf/qwen/qwq-32b", + "id": "deepseek-v3.2", + "name": "DeepSeek-V3.2", + "display_name": "DeepSeek-V3.2", "modalities": { "input": [ "text" @@ -40742,59 +39086,62 @@ ] }, "limit": { - "context": 24000, - "output": 24000 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "release_date": "2025-03-05", - "last_updated": "2025-03-11", + "knowledge": "2024-07", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "cost": { - "input": 0.66, - "output": 1 - }, - "type": "chat" + "input": 0.58, + "output": 1.68 + } }, { - "id": "zephyr-7b-beta-awq", - "name": "@hf/thebloke/zephyr-7b-beta-awq", - "display_name": "@hf/thebloke/zephyr-7b-beta-awq", + "id": "gpt-5-pro", + "name": "GPT-5 Pro", + "display_name": "GPT-5 Pro", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 4096, - "output": 4096 + "context": 400000, + "output": 272000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2023-10-27", - "last_updated": "2023-11-09", + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-10-06", + "last_updated": "2025-10-06", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 15, + "output": 120 + } }, { - "id": "deepseek-coder-6.7b-instruct-awq", - "name": "@hf/thebloke/deepseek-coder-6.7b-instruct-awq", - "display_name": "@hf/thebloke/deepseek-coder-6.7b-instruct-awq", + "id": "mistral-large-2411", + "name": "Mistral Large 24.11", + "display_name": "Mistral Large 24.11", "modalities": { "input": [ "text" @@ -40804,28 +39151,62 @@ ] }, "limit": { - "context": 4096, - "output": 4096 - }, + "context": 128000, + "output": 32768 + }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2023-11-05", - "last_updated": "2023-11-13", + "open_weights": false, + "knowledge": "2024-09", + "release_date": "2024-11-01", + "last_updated": "2024-11-01", "cost": { - "input": 0, - "output": 0 + "input": 2, + "output": 6 + } + }, + { + "id": "gpt-5.2", + "name": "GPT-5.2", + "display_name": "GPT-5.2", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] }, - "type": "chat" + "limit": { + "context": 400000, + "output": 128000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", + "cost": { + "input": 1.75, + "output": 14, + "cache_read": 0.125 + } }, { - "id": "llama-3.1-8b-instruct-awq", - "name": "@cf/meta/llama-3.1-8b-instruct-awq", - "display_name": "@cf/meta/llama-3.1-8b-instruct-awq", + "id": "codestral-2501", + "name": "Codestral 25.01", + "display_name": "Codestral 25.01", "modalities": { "input": [ "text" @@ -40835,8 +39216,8 @@ ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 256000, + "output": 256000 }, "temperature": true, "tool_call": true, @@ -40844,53 +39225,53 @@ "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2024-07-25", - "last_updated": "2024-07-25", + "open_weights": false, + "knowledge": "2024-03", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.12, - "output": 0.27 - }, - "type": "chat" + "input": 0.3, + "output": 0.9 + } }, { - "id": "mistral-7b-instruct-v0.2-lora", - "name": "@cf/mistral/mistral-7b-instruct-v0.2-lora", - "display_name": "@cf/mistral/mistral-7b-instruct-v0.2-lora", + "id": "mistral-small-2503", + "name": "Mistral Small 3.1", + "display_name": "Mistral Small 3.1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 15000, - "output": 15000 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2024-04-01", - "last_updated": "2024-04-01", + "attachment": true, + "open_weights": false, + "knowledge": "2024-09", + "release_date": "2025-03-01", + "last_updated": "2025-03-01", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.1, + "output": 0.3 + } }, { - "id": "uform-gen2-qwen-500m", - "name": "@cf/unum/uform-gen2-qwen-500m", - "display_name": "@cf/unum/uform-gen2-qwen-500m", + "id": "gpt-3.5-turbo-1106", + "name": "GPT-3.5 Turbo 1106", + "display_name": "GPT-3.5 Turbo 1106", "modalities": { "input": [ - "image", "text" ], "output": [ @@ -40898,37 +39279,37 @@ ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 16384, + "output": 16384 }, - "temperature": false, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2024-02-15", - "last_updated": "2024-04-24", + "open_weights": false, + "knowledge": "2021-08", + "release_date": "2023-11-06", + "last_updated": "2023-11-06", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 1, + "output": 2 + } } ] }, - "inception": { - "id": "inception", - "name": "Inception", - "display_name": "Inception", - "api": "https://api.inceptionlabs.ai/v1/", - "doc": "https://platform.inceptionlabs.ai/docs", + "baseten": { + "id": "baseten", + "name": "Baseten", + "display_name": "Baseten", + "api": "https://inference.baseten.co/v1", + "doc": "https://docs.baseten.co/development/model-apis/overview", "models": [ { - "id": "mercury-coder", - "name": "Mercury Coder", - "display_name": "Mercury Coder", + "id": "moonshotai/Kimi-K2-Instruct-0905", + "name": "Kimi K2 Instruct 0905", + "display_name": "Kimi K2 Instruct 0905", "modalities": { "input": [ "text" @@ -40938,8 +39319,8 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -40947,22 +39328,19 @@ "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2023-10", - "release_date": "2025-02-26", - "last_updated": "2025-07-31", + "open_weights": true, + "knowledge": "2025-08", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", "cost": { - "input": 0.25, - "output": 1, - "cache_read": 0.25, - "cache_write": 1 - }, - "type": "chat" + "input": 0.6, + "output": 2.5 + } }, { - "id": "mercury", - "name": "Mercury", - "display_name": "Mercury", + "id": "moonshotai/Kimi-K2-Thinking", + "name": "Kimi K2 Thinking", + "display_name": "Kimi K2 Thinking", "modalities": { "input": [ "text" @@ -40972,40 +39350,29 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2023-10", - "release_date": "2025-06-26", - "last_updated": "2025-07-31", + "open_weights": true, + "knowledge": "2024-08", + "release_date": "2025-11-06", + "last_updated": "2025-11-06", "cost": { - "input": 0.25, - "output": 1, - "cache_read": 0.25, - "cache_write": 1 - }, - "type": "chat" - } - ] - }, - "wandb": { - "id": "wandb", - "name": "Weights & Biases", - "display_name": "Weights & Biases", - "api": "https://api.inference.wandb.ai/v1", - "doc": "https://weave-docs.wandb.ai/guides/integrations/inference/", - "models": [ + "input": 0.6, + "output": 2.5 + } + }, { - "id": "moonshotai/Kimi-K2-Instruct", - "name": "Kimi-K2-Instruct", - "display_name": "Kimi-K2-Instruct", + "id": "Qwen/Qwen3-Coder-480B-A35B-Instruct", + "name": "Qwen3 Coder 480B A35B Instruct", + "display_name": "Qwen3 Coder 480B A35B Instruct", "modalities": { "input": [ "text" @@ -41015,8 +39382,8 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 262144, + "output": 66536 }, "temperature": true, "tool_call": true, @@ -41025,19 +39392,18 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-07-14", - "last_updated": "2025-07-14", + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", "cost": { - "input": 1.35, - "output": 4 - }, - "type": "chat" + "input": 0.38, + "output": 1.53 + } }, { - "id": "microsoft/Phi-4-mini-instruct", - "name": "Phi-4-mini-instruct", - "display_name": "Phi-4-mini-instruct", + "id": "zai-org/GLM-4.7", + "name": "GLM-4.7", + "display_name": "GLM-4.7", "modalities": { "input": [ "text" @@ -41047,8 +39413,8 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -41058,19 +39424,18 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "cost": { - "input": 0.08, - "output": 0.35 - }, - "type": "chat" + "input": 0.6, + "output": 2.2 + } }, { - "id": "meta-llama/Llama-3.1-8B-Instruct", - "name": "Meta-Llama-3.1-8B-Instruct", - "display_name": "Meta-Llama-3.1-8B-Instruct", + "id": "zai-org/GLM-4.6", + "name": "GLM 4.6", + "display_name": "GLM 4.6", "modalities": { "input": [ "text" @@ -41080,30 +39445,28 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 200000, + "output": 200000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "knowledge": "2025-08-31", + "release_date": "2025-09-16", + "last_updated": "2025-09-16", "cost": { - "input": 0.22, - "output": 0.22 - }, - "type": "chat" + "input": 0.6, + "output": 2.2 + } }, { - "id": "meta-llama/Llama-3.3-70B-Instruct", - "name": "Llama-3.3-70B-Instruct", - "display_name": "Llama-3.3-70B-Instruct", + "id": "deepseek-ai/DeepSeek-V3.2", + "name": "DeepSeek V3.2", + "display_name": "DeepSeek V3.2", "modalities": { "input": [ "text" @@ -41113,42 +39476,48 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 163800, + "output": 131100 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "knowledge": "2025-10", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "cost": { - "input": 0.71, - "output": 0.71 - }, - "type": "chat" - }, + "input": 0.3, + "output": 0.45 + } + } + ] + }, + "moark": { + "id": "moark", + "name": "Moark", + "display_name": "Moark", + "api": "https://moark.com/v1", + "doc": "https://moark.com/docs/openapi/v1#tag/%E6%96%87%E6%9C%AC%E7%94%9F%E6%88%90", + "models": [ { - "id": "meta-llama/Llama-4-Scout-17B-16E-Instruct", - "name": "Llama 4 Scout 17B 16E Instruct", - "display_name": "Llama 4 Scout 17B 16E Instruct", + "id": "GLM-4.7", + "name": "GLM-4.7", + "display_name": "GLM-4.7", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 64000, - "output": 8192 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -41158,19 +39527,18 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-01-31", - "last_updated": "2025-01-31", + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "cost": { - "input": 0.17, - "output": 0.66 - }, - "type": "chat" + "input": 3.5, + "output": 14 + } }, { - "id": "Qwen/Qwen3-235B-A22B-Instruct-2507", - "name": "Qwen3 235B A22B Instruct 2507", - "display_name": "Qwen3 235B A22B Instruct 2507", + "id": "MiniMax-M2.1", + "name": "MiniMax-M2.1", + "display_name": "MiniMax-M2.1", "modalities": { "input": [ "text" @@ -41180,29 +39548,37 @@ ] }, "limit": { - "context": 262144, + "context": 204800, "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04-28", - "last_updated": "2025-07-21", + "release_date": "2025-12-23", + "last_updated": "2025-12-23", "cost": { - "input": 0.1, - "output": 0.1 - }, - "type": "chat" - }, + "input": 2.1, + "output": 8.4 + } + } + ] + }, + "siliconflow-com": { + "id": "siliconflow-com", + "name": "SiliconFlow", + "display_name": "SiliconFlow", + "api": "https://api.siliconflow.com/v1", + "doc": "https://cloud.siliconflow.com/models", + "models": [ { - "id": "Qwen/Qwen3-Coder-480B-A35B-Instruct", - "name": "Qwen3-Coder-480B-A35B-Instruct", - "display_name": "Qwen3-Coder-480B-A35B-Instruct", + "id": "inclusionAI/Ling-mini-2.0", + "name": "inclusionAI/Ling-mini-2.0", + "display_name": "inclusionAI/Ling-mini-2.0", "modalities": { "input": [ "text" @@ -41212,8 +39588,8 @@ ] }, "limit": { - "context": 262144, - "output": 66536 + "context": 131000, + "output": 131000 }, "temperature": true, "tool_call": true, @@ -41221,20 +39597,18 @@ "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-23", - "last_updated": "2025-07-23", + "open_weights": false, + "release_date": "2025-09-10", + "last_updated": "2025-11-25", "cost": { - "input": 1, - "output": 1.5 - }, - "type": "chat" + "input": 0.07, + "output": 0.28 + } }, { - "id": "Qwen/Qwen3-235B-A22B-Thinking-2507", - "name": "Qwen3-235B-A22B-Thinking-2507", - "display_name": "Qwen3-235B-A22B-Thinking-2507", + "id": "inclusionAI/Ling-flash-2.0", + "name": "inclusionAI/Ling-flash-2.0", + "display_name": "inclusionAI/Ling-flash-2.0", "modalities": { "input": [ "text" @@ -41244,30 +39618,27 @@ ] }, "limit": { - "context": 262144, - "output": 131072 + "context": 131000, + "output": 131000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-25", - "last_updated": "2025-07-25", + "open_weights": false, + "release_date": "2025-09-18", + "last_updated": "2025-11-25", "cost": { - "input": 0.1, - "output": 0.1 - }, - "type": "chat" + "input": 0.14, + "output": 0.57 + } }, { - "id": "deepseek-ai/DeepSeek-R1-0528", - "name": "DeepSeek-R1-0528", - "display_name": "DeepSeek-R1-0528", + "id": "inclusionAI/Ring-flash-2.0", + "name": "inclusionAI/Ring-flash-2.0", + "display_name": "inclusionAI/Ring-flash-2.0", "modalities": { "input": [ "text" @@ -41277,8 +39648,8 @@ ] }, "limit": { - "context": 161000, - "output": 163840 + "context": 131000, + "output": 131000 }, "temperature": true, "tool_call": true, @@ -41287,20 +39658,18 @@ "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2025-05", - "release_date": "2025-05-28", - "last_updated": "2025-05-28", + "open_weights": false, + "release_date": "2025-09-29", + "last_updated": "2025-11-25", "cost": { - "input": 1.35, - "output": 5.4 - }, - "type": "chat" + "input": 0.14, + "output": 0.57 + } }, { - "id": "deepseek-ai/DeepSeek-V3-0324", - "name": "DeepSeek-V3-0324", - "display_name": "DeepSeek-V3-0324", + "id": "moonshotai/Kimi-K2-Instruct", + "name": "moonshotai/Kimi-K2-Instruct", + "display_name": "moonshotai/Kimi-K2-Instruct", "modalities": { "input": [ "text" @@ -41310,8 +39679,8 @@ ] }, "limit": { - "context": 161000, - "output": 8192 + "context": 131000, + "output": 131000 }, "temperature": true, "tool_call": true, @@ -41319,29 +39688,18 @@ "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-03-24", - "last_updated": "2025-03-24", + "open_weights": false, + "release_date": "2025-07-13", + "last_updated": "2025-11-25", "cost": { - "input": 1.14, - "output": 2.75 - }, - "type": "chat" - } - ] - }, - "cloudflare-ai-gateway": { - "id": "cloudflare-ai-gateway", - "name": "Cloudflare AI Gateway", - "display_name": "Cloudflare AI Gateway", - "api": "https://gateway.ai.cloudflare.com/v1/${CLOUDFLARE_ACCOUNT_ID}/${CLOUDFLARE_GATEWAY_ID}/compat/", - "doc": "https://developers.cloudflare.com/ai-gateway/", - "models": [ + "input": 0.58, + "output": 2.29 + } + }, { - "id": "openai/gpt-4", - "name": "GPT-4", - "display_name": "GPT-4", + "id": "moonshotai/Kimi-Dev-72B", + "name": "moonshotai/Kimi-Dev-72B", + "display_name": "moonshotai/Kimi-Dev-72B", "modalities": { "input": [ "text" @@ -41351,29 +39709,27 @@ ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 131000, + "output": 131000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2023-11", - "release_date": "2023-11-06", - "last_updated": "2024-04-09", + "release_date": "2025-06-19", + "last_updated": "2025-11-25", "cost": { - "input": 30, - "output": 60 - }, - "type": "chat" + "input": 0.29, + "output": 1.15 + } }, { - "id": "openai/gpt-5.1-codex", - "name": "GPT-5.1 Codex", - "display_name": "GPT-5.1 Codex", + "id": "moonshotai/Kimi-K2.5", + "name": "moonshotai/Kimi-K2.5", + "display_name": "moonshotai/Kimi-K2.5", "modalities": { "input": [ "text", @@ -41384,31 +39740,28 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 262000, + "output": 262000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "release_date": "2026-01-27", + "last_updated": "2026-01-27", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 - }, - "type": "chat" + "input": 0.55, + "output": 3 + } }, { - "id": "openai/gpt-3.5-turbo", - "name": "GPT-3.5-turbo", - "display_name": "GPT-3.5-turbo", + "id": "moonshotai/Kimi-K2-Instruct-0905", + "name": "moonshotai/Kimi-K2-Instruct-0905", + "display_name": "moonshotai/Kimi-K2-Instruct-0905", "modalities": { "input": [ "text" @@ -41418,63 +39771,58 @@ ] }, "limit": { - "context": 16385, - "output": 4096 + "context": 262000, + "output": 262000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2021-09-01", - "release_date": "2023-03-01", - "last_updated": "2023-11-06", + "release_date": "2025-09-08", + "last_updated": "2025-11-25", "cost": { - "input": 0.5, - "output": 1.5, - "cache_read": 1.25 - }, - "type": "chat" + "input": 0.4, + "output": 2 + } }, { - "id": "openai/gpt-4-turbo", - "name": "GPT-4 Turbo", - "display_name": "GPT-4 Turbo", + "id": "moonshotai/Kimi-K2-Thinking", + "name": "moonshotai/Kimi-K2-Thinking", + "display_name": "moonshotai/Kimi-K2-Thinking", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2023-12", - "release_date": "2023-11-06", - "last_updated": "2024-04-09", + "release_date": "2025-11-07", + "last_updated": "2025-11-25", "cost": { - "input": 10, - "output": 30 - }, - "type": "chat" + "input": 0.55, + "output": 2.5 + } }, { - "id": "openai/o3-mini", - "name": "o3-mini", - "display_name": "o3-mini", + "id": "tencent/Hunyuan-MT-7B", + "name": "tencent/Hunyuan-MT-7B", + "display_name": "tencent/Hunyuan-MT-7B", "modalities": { "input": [ "text" @@ -41484,204 +39832,178 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 33000, + "output": 33000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2024-05", - "release_date": "2024-12-20", - "last_updated": "2025-01-29", + "release_date": "2025-09-18", + "last_updated": "2025-11-25", "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.55 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "openai/gpt-5.1", - "name": "GPT-5.1", - "display_name": "GPT-5.1", + "id": "tencent/Hunyuan-A13B-Instruct", + "name": "tencent/Hunyuan-A13B-Instruct", + "display_name": "tencent/Hunyuan-A13B-Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 131000, + "output": 131000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "release_date": "2025-06-30", + "last_updated": "2025-11-25", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.13 - }, - "type": "chat" + "input": 0.14, + "output": 0.57 + } }, { - "id": "openai/gpt-4o", - "name": "GPT-4o", - "display_name": "GPT-4o", + "id": "MiniMaxAI/MiniMax-M2", + "name": "MiniMaxAI/MiniMax-M2", + "display_name": "MiniMaxAI/MiniMax-M2", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 197000, + "output": 131000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-05-13", - "last_updated": "2024-08-06", + "release_date": "2025-10-28", + "last_updated": "2025-11-25", "cost": { - "input": 2.5, - "output": 10, - "cache_read": 1.25 - }, - "type": "chat" + "input": 0.3, + "output": 1.2 + } }, { - "id": "openai/o4-mini", - "name": "o4-mini", - "display_name": "o4-mini", + "id": "MiniMaxAI/MiniMax-M1-80k", + "name": "MiniMaxAI/MiniMax-M1-80k", + "display_name": "MiniMaxAI/MiniMax-M1-80k", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 131000, + "output": 131000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-05", - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "release_date": "2025-06-17", + "last_updated": "2025-11-25", "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.28 - }, - "type": "chat" + "input": 0.55, + "output": 2.2 + } }, { - "id": "openai/o1", - "name": "o1", - "display_name": "o1", + "id": "MiniMaxAI/MiniMax-M2.1", + "name": "MiniMaxAI/MiniMax-M2.1", + "display_name": "MiniMaxAI/MiniMax-M2.1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 197000, + "output": 131000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-12-05", - "last_updated": "2024-12-05", + "release_date": "2025-12-23", + "last_updated": "2025-12-23", "cost": { - "input": 15, - "output": 60, - "cache_read": 7.5 - }, - "type": "chat" + "input": 0.3, + "output": 1.2 + } }, { - "id": "openai/o3-pro", - "name": "o3-pro", - "display_name": "o3-pro", + "id": "THUDM/GLM-4-32B-0414", + "name": "THUDM/GLM-4-32B-0414", + "display_name": "THUDM/GLM-4-32B-0414", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 33000, + "output": 33000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-05", - "release_date": "2025-06-10", - "last_updated": "2025-06-10", + "release_date": "2025-04-18", + "last_updated": "2025-11-25", "cost": { - "input": 20, - "output": 80 - }, - "type": "chat" + "input": 0.27, + "output": 0.27 + } }, { - "id": "openai/o3", - "name": "o3", - "display_name": "o3", + "id": "THUDM/GLM-4.1V-9B-Thinking", + "name": "THUDM/GLM-4.1V-9B-Thinking", + "display_name": "THUDM/GLM-4.1V-9B-Thinking", "modalities": { "input": [ "text", @@ -41692,10 +40014,10 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 66000, + "output": 66000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -41703,102 +40025,89 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-05", - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "release_date": "2025-07-04", + "last_updated": "2025-11-25", "cost": { - "input": 2, - "output": 8, - "cache_read": 0.5 - }, - "type": "chat" + "input": 0.035, + "output": 0.14 + } }, { - "id": "openai/gpt-4o-mini", - "name": "GPT-4o mini", - "display_name": "GPT-4o mini", + "id": "THUDM/GLM-Z1-9B-0414", + "name": "THUDM/GLM-Z1-9B-0414", + "display_name": "THUDM/GLM-Z1-9B-0414", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 131000, + "output": 131000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-07-18", - "last_updated": "2024-07-18", + "release_date": "2025-04-18", + "last_updated": "2025-11-25", "cost": { - "input": 0.15, - "output": 0.6, - "cache_read": 0.08 - }, - "type": "chat" + "input": 0.086, + "output": 0.086 + } }, { - "id": "openai/gpt-5.2", - "name": "GPT-5.2", - "display_name": "GPT-5.2", + "id": "THUDM/GLM-4-9B-0414", + "name": "THUDM/GLM-4-9B-0414", + "display_name": "THUDM/GLM-4-9B-0414", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 33000, + "output": 33000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "release_date": "2025-04-18", + "last_updated": "2025-11-25", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 - }, - "type": "chat" + "input": 0.086, + "output": 0.086 + } }, { - "id": "anthropic/claude-opus-4", - "name": "Claude Opus 4 (latest)", - "display_name": "Claude Opus 4 (latest)", + "id": "THUDM/GLM-Z1-32B-0414", + "name": "THUDM/GLM-Z1-32B-0414", + "display_name": "THUDM/GLM-Z1-32B-0414", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 131000, + "output": 131000 }, "temperature": true, "tool_call": true, @@ -41806,73 +40115,60 @@ "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "release_date": "2025-04-18", + "last_updated": "2025-11-25", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 - }, - "type": "chat" + "input": 0.14, + "output": 0.57 + } }, { - "id": "anthropic/claude-opus-4-1", - "name": "Claude Opus 4.1 (latest)", - "display_name": "Claude Opus 4.1 (latest)", + "id": "openai/gpt-oss-20b", + "name": "openai/gpt-oss-20b", + "display_name": "openai/gpt-oss-20b", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 131000, + "output": 8000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "release_date": "2025-08-13", + "last_updated": "2025-11-25", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 - }, - "type": "chat" + "input": 0.04, + "output": 0.18 + } }, { - "id": "anthropic/claude-haiku-4-5", - "name": "Claude Haiku 4.5 (latest)", - "display_name": "Claude Haiku 4.5 (latest)", + "id": "openai/gpt-oss-120b", + "name": "openai/gpt-oss-120b", + "display_name": "openai/gpt-oss-120b", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 131000, + "output": 8000 }, "temperature": true, "tool_call": true, @@ -41880,36 +40176,31 @@ "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-02-28", - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "release_date": "2025-08-13", + "last_updated": "2025-11-25", "cost": { - "input": 1, - "output": 5, - "cache_read": 0.1, - "cache_write": 1.25 - }, - "type": "chat" + "input": 0.05, + "output": 0.45 + } }, { - "id": "anthropic/claude-3-haiku", - "name": "Claude Haiku 3", - "display_name": "Claude Haiku 3", + "id": "stepfun-ai/step3", + "name": "stepfun-ai/step3", + "display_name": "stepfun-ai/step3", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 4096 + "context": 66000, + "output": 66000 }, "temperature": true, "tool_call": true, @@ -41918,34 +40209,28 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2023-08-31", - "release_date": "2024-03-13", - "last_updated": "2024-03-13", + "release_date": "2025-08-06", + "last_updated": "2025-11-25", "cost": { - "input": 0.25, - "output": 1.25, - "cache_read": 0.03, - "cache_write": 0.3 - }, - "type": "chat" + "input": 0.57, + "output": 1.42 + } }, { - "id": "anthropic/claude-opus-4-5", - "name": "Claude Opus 4.5 (latest)", - "display_name": "Claude Opus 4.5 (latest)", + "id": "nex-agi/DeepSeek-V3.1-Nex-N1", + "name": "nex-agi/DeepSeek-V3.1-Nex-N1", + "display_name": "nex-agi/DeepSeek-V3.1-Nex-N1", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 131000, + "output": 131000 }, "temperature": true, "tool_call": true, @@ -41953,217 +40238,182 @@ "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-11-24", - "last_updated": "2025-11-24", + "release_date": "2025-01-01", + "last_updated": "2025-11-25", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 - }, - "type": "chat" + "input": 0.5, + "output": 2 + } }, { - "id": "anthropic/claude-3-opus", - "name": "Claude Opus 3", - "display_name": "Claude Opus 3", + "id": "baidu/ERNIE-4.5-300B-A47B", + "name": "baidu/ERNIE-4.5-300B-A47B", + "display_name": "baidu/ERNIE-4.5-300B-A47B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 4096 + "context": 131000, + "output": 131000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2023-08-31", - "release_date": "2024-02-29", - "last_updated": "2024-02-29", + "release_date": "2025-07-02", + "last_updated": "2025-11-25", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 - }, - "type": "chat" + "input": 0.28, + "output": 1.1 + } }, { - "id": "anthropic/claude-sonnet-4-5", - "name": "Claude Sonnet 4.5 (latest)", - "display_name": "Claude Sonnet 4.5 (latest)", + "id": "ByteDance-Seed/Seed-OSS-36B-Instruct", + "name": "ByteDance-Seed/Seed-OSS-36B-Instruct", + "display_name": "ByteDance-Seed/Seed-OSS-36B-Instruct", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "release_date": "2025-09-04", + "last_updated": "2025-11-25", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 - }, - "type": "chat" + "input": 0.21, + "output": 0.57 + } }, { - "id": "anthropic/claude-3.5-sonnet", - "name": "Claude Sonnet 3.5 v2", - "display_name": "Claude Sonnet 3.5 v2", + "id": "meta-llama/Meta-Llama-3.1-8B-Instruct", + "name": "meta-llama/Meta-Llama-3.1-8B-Instruct", + "display_name": "meta-llama/Meta-Llama-3.1-8B-Instruct", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 8192 + "context": 33000, + "output": 4000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-04-30", - "release_date": "2024-10-22", - "last_updated": "2024-10-22", + "release_date": "2025-04-23", + "last_updated": "2025-11-25", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 - }, - "type": "chat" + "input": 0.06, + "output": 0.06 + } }, { - "id": "anthropic/claude-3-sonnet", - "name": "Claude Sonnet 3", - "display_name": "Claude Sonnet 3", + "id": "Qwen/Qwen3-30B-A3B", + "name": "Qwen/Qwen3-30B-A3B", + "display_name": "Qwen/Qwen3-30B-A3B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 4096 + "context": 131000, + "output": 131000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2023-08-31", - "release_date": "2024-03-04", - "last_updated": "2024-03-04", + "release_date": "2025-04-30", + "last_updated": "2025-11-25", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 0.3 - }, - "type": "chat" + "input": 0.09, + "output": 0.45 + } }, { - "id": "anthropic/claude-3-5-haiku", - "name": "Claude Haiku 3.5 (latest)", - "display_name": "Claude Haiku 3.5 (latest)", + "id": "Qwen/Qwen3-30B-A3B-Thinking-2507", + "name": "Qwen/Qwen3-30B-A3B-Thinking-2507", + "display_name": "Qwen/Qwen3-30B-A3B-Thinking-2507", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 8192 + "context": 262000, + "output": 131000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-07-31", - "release_date": "2024-10-22", - "last_updated": "2024-10-22", + "release_date": "2025-07-31", + "last_updated": "2025-11-25", "cost": { - "input": 0.8, - "output": 4, - "cache_read": 0.08, - "cache_write": 1 - }, - "type": "chat" + "input": 0.09, + "output": 0.3 + } }, { - "id": "anthropic/claude-3.5-haiku", - "name": "Claude Haiku 3.5 (latest)", - "display_name": "Claude Haiku 3.5 (latest)", + "id": "Qwen/Qwen3-VL-30B-A3B-Instruct", + "name": "Qwen/Qwen3-VL-30B-A3B-Instruct", + "display_name": "Qwen/Qwen3-VL-30B-A3B-Instruct", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 8192 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, @@ -42172,66 +40422,47 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-07-31", - "release_date": "2024-10-22", - "last_updated": "2024-10-22", + "release_date": "2025-10-05", + "last_updated": "2025-11-25", "cost": { - "input": 0.8, - "output": 4, - "cache_read": 0.08, - "cache_write": 1 - }, - "type": "chat" + "input": 0.29, + "output": 1 + } }, { - "id": "anthropic/claude-sonnet-4", - "name": "Claude Sonnet 4 (latest)", - "display_name": "Claude Sonnet 4 (latest)", + "id": "Qwen/Qwen3-14B", + "name": "Qwen/Qwen3-14B", + "display_name": "Qwen/Qwen3-14B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 131000, + "output": 131000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "release_date": "2025-04-30", + "last_updated": "2025-11-25", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 - }, - "type": "chat" - } - ] - }, - "openai": { - "id": "openai", - "name": "OpenAI", - "display_name": "OpenAI", - "doc": "https://platform.openai.com/docs/models", - "models": [ + "input": 0.07, + "output": 0.28 + } + }, { - "id": "gpt-4.1-nano", - "name": "GPT-4.1 nano", - "display_name": "GPT-4.1 nano", + "id": "Qwen/Qwen2.5-VL-32B-Instruct", + "name": "Qwen/Qwen2.5-VL-32B-Instruct", + "display_name": "Qwen/Qwen2.5-VL-32B-Instruct", "modalities": { "input": [ "text", @@ -42242,8 +40473,8 @@ ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 131000, + "output": 131000 }, "temperature": true, "tool_call": true, @@ -42252,52 +40483,47 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "release_date": "2025-03-24", + "last_updated": "2025-11-25", "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.03 - }, - "type": "chat" + "input": 0.27, + "output": 0.27 + } }, { - "id": "text-embedding-3-small", - "name": "text-embedding-3-small", - "display_name": "text-embedding-3-small", + "id": "Qwen/Qwen3-Omni-30B-A3B-Captioner", + "name": "Qwen/Qwen3-Omni-30B-A3B-Captioner", + "display_name": "Qwen/Qwen3-Omni-30B-A3B-Captioner", "modalities": { "input": [ - "text" + "audio" ], "output": [ "text" ] }, "limit": { - "context": 8191, - "output": 1536 + "context": 66000, + "output": 66000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-01", - "release_date": "2024-01-25", - "last_updated": "2024-01-25", + "release_date": "2025-10-04", + "last_updated": "2025-11-25", "cost": { - "input": 0.02, - "output": 0 - }, - "type": "embedding" + "input": 0.1, + "output": 0.4 + } }, { - "id": "gpt-4", - "name": "GPT-4", - "display_name": "GPT-4", + "id": "Qwen/Qwen3-8B", + "name": "Qwen/Qwen3-8B", + "display_name": "Qwen/Qwen3-8B", "modalities": { "input": [ "text" @@ -42307,63 +40533,59 @@ ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 131000, + "output": 131000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2023-11", - "release_date": "2023-11-06", - "last_updated": "2024-04-09", + "release_date": "2025-04-30", + "last_updated": "2025-11-25", "cost": { - "input": 30, - "output": 60 - }, - "type": "chat" + "input": 0.06, + "output": 0.06 + } }, { - "id": "o1-pro", - "name": "o1-pro", - "display_name": "o1-pro", + "id": "Qwen/Qwen3-Omni-30B-A3B-Instruct", + "name": "Qwen/Qwen3-Omni-30B-A3B-Instruct", + "display_name": "Qwen/Qwen3-Omni-30B-A3B-Instruct", "modalities": { "input": [ "text", - "image" + "image", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 66000, + "output": 66000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2025-03-19", - "last_updated": "2025-03-19", + "release_date": "2025-10-04", + "last_updated": "2025-11-25", "cost": { - "input": 150, - "output": 600 - }, - "type": "chat" + "input": 0.1, + "output": 0.4 + } }, { - "id": "gpt-4o-2024-05-13", - "name": "GPT-4o (2024-05-13)", - "display_name": "GPT-4o (2024-05-13)", + "id": "Qwen/Qwen3-VL-8B-Thinking", + "name": "Qwen/Qwen3-VL-8B-Thinking", + "display_name": "Qwen/Qwen3-VL-8B-Thinking", "modalities": { "input": [ "text", @@ -42374,167 +40596,148 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-05-13", - "last_updated": "2024-05-13", + "release_date": "2025-10-15", + "last_updated": "2025-11-25", "cost": { - "input": 5, - "output": 15 - }, - "type": "chat" + "input": 0.18, + "output": 2 + } }, { - "id": "gpt-5.1-codex", - "name": "GPT-5.1 Codex", - "display_name": "GPT-5.1 Codex", + "id": "Qwen/Qwen3-235B-A22B-Instruct-2507", + "name": "Qwen/Qwen3-235B-A22B-Instruct-2507", + "display_name": "Qwen/Qwen3-235B-A22B-Instruct-2507", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 262000, + "output": 262000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "release_date": "2025-07-23", + "last_updated": "2025-11-25", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 - }, - "type": "chat" + "input": 0.09, + "output": 0.6 + } }, { - "id": "gpt-4o-2024-08-06", - "name": "GPT-4o (2024-08-06)", - "display_name": "GPT-4o (2024-08-06)", + "id": "Qwen/Qwen2.5-Coder-32B-Instruct", + "name": "Qwen/Qwen2.5-Coder-32B-Instruct", + "display_name": "Qwen/Qwen2.5-Coder-32B-Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 33000, + "output": 4000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-08-06", - "last_updated": "2024-08-06", + "release_date": "2024-11-11", + "last_updated": "2025-11-25", "cost": { - "input": 2.5, - "output": 10, - "cache_read": 1.25 - }, - "type": "chat" + "input": 0.18, + "output": 0.18 + } }, { - "id": "gpt-4.1-mini", - "name": "GPT-4.1 mini", - "display_name": "GPT-4.1 mini", + "id": "Qwen/Qwen2.5-32B-Instruct", + "name": "Qwen/Qwen2.5-32B-Instruct", + "display_name": "Qwen/Qwen2.5-32B-Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 33000, + "output": 4000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "release_date": "2024-09-19", + "last_updated": "2025-11-25", "cost": { - "input": 0.4, - "output": 1.6, - "cache_read": 0.1 - }, - "type": "chat" + "input": 0.18, + "output": 0.18 + } }, { - "id": "o3-deep-research", - "name": "o3-deep-research", - "display_name": "o3-deep-research", + "id": "Qwen/Qwen2.5-72B-Instruct-128K", + "name": "Qwen/Qwen2.5-72B-Instruct-128K", + "display_name": "Qwen/Qwen2.5-72B-Instruct-128K", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 131000, + "output": 4000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-05", - "release_date": "2024-06-26", - "last_updated": "2024-06-26", + "release_date": "2024-09-18", + "last_updated": "2025-11-25", "cost": { - "input": 10, - "output": 40, - "cache_read": 2.5 - }, - "type": "chat" + "input": 0.59, + "output": 0.59 + } }, { - "id": "gpt-3.5-turbo", - "name": "GPT-3.5-turbo", - "display_name": "GPT-3.5-turbo", + "id": "Qwen/Qwen2.5-72B-Instruct", + "name": "Qwen/Qwen2.5-72B-Instruct", + "display_name": "Qwen/Qwen2.5-72B-Instruct", "modalities": { "input": [ "text" @@ -42544,64 +40747,57 @@ ] }, "limit": { - "context": 16385, - "output": 4096 + "context": 33000, + "output": 4000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2021-09-01", - "release_date": "2023-03-01", - "last_updated": "2023-11-06", + "release_date": "2024-09-18", + "last_updated": "2025-11-25", "cost": { - "input": 0.5, - "output": 1.5, - "cache_read": 1.25 - }, - "type": "chat" + "input": 0.59, + "output": 0.59 + } }, { - "id": "gpt-5.2-pro", - "name": "GPT-5.2 Pro", - "display_name": "GPT-5.2 Pro", + "id": "Qwen/Qwen3-Coder-30B-A3B-Instruct", + "name": "Qwen/Qwen3-Coder-30B-A3B-Instruct", + "display_name": "Qwen/Qwen3-Coder-30B-A3B-Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 262000, + "output": 262000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "release_date": "2025-08-01", + "last_updated": "2025-11-25", "cost": { - "input": 21, - "output": 168 - }, - "type": "chat" + "input": 0.07, + "output": 0.28 + } }, { - "id": "text-embedding-3-large", - "name": "text-embedding-3-large", - "display_name": "text-embedding-3-large", + "id": "Qwen/Qwen2.5-7B-Instruct", + "name": "Qwen/Qwen2.5-7B-Instruct", + "display_name": "Qwen/Qwen2.5-7B-Instruct", "modalities": { "input": [ "text" @@ -42611,29 +40807,57 @@ ] }, "limit": { - "context": 8191, - "output": 3072 + "context": 33000, + "output": 4000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2024-01", - "release_date": "2024-01-25", - "last_updated": "2024-01-25", + "release_date": "2024-09-18", + "last_updated": "2025-11-25", "cost": { - "input": 0.13, - "output": 0 + "input": 0.05, + "output": 0.05 + } + }, + { + "id": "Qwen/Qwen3-235B-A22B", + "name": "Qwen/Qwen3-235B-A22B", + "display_name": "Qwen/Qwen3-235B-A22B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] }, - "type": "embedding" + "limit": { + "context": 131000, + "output": 131000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-04-30", + "last_updated": "2025-11-25", + "cost": { + "input": 0.35, + "output": 1.42 + } }, { - "id": "gpt-4-turbo", - "name": "GPT-4 Turbo", - "display_name": "GPT-4 Turbo", + "id": "Qwen/Qwen2.5-VL-72B-Instruct", + "name": "Qwen/Qwen2.5-VL-72B-Instruct", + "display_name": "Qwen/Qwen2.5-VL-72B-Instruct", "modalities": { "input": [ "text", @@ -42644,8 +40868,8 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 131000, + "output": 4000 }, "temperature": true, "tool_call": true, @@ -42654,19 +40878,17 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2023-12", - "release_date": "2023-11-06", - "last_updated": "2024-04-09", + "release_date": "2025-01-28", + "last_updated": "2025-11-25", "cost": { - "input": 10, - "output": 30 - }, - "type": "chat" + "input": 0.59, + "output": 0.59 + } }, { - "id": "o1-preview", - "name": "o1-preview", - "display_name": "o1-preview", + "id": "Qwen/QwQ-32B", + "name": "Qwen/QwQ-32B", + "display_name": "Qwen/QwQ-32B", "modalities": { "input": [ "text" @@ -42676,31 +40898,28 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 131000, + "output": 131000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, "attachment": false, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-09-12", - "last_updated": "2024-09-12", + "release_date": "2025-03-06", + "last_updated": "2025-11-25", "cost": { - "input": 15, - "output": 60, - "cache_read": 7.5 - }, - "type": "chat" + "input": 0.15, + "output": 0.58 + } }, { - "id": "gpt-5.1-codex-mini", - "name": "GPT-5.1 Codex mini", - "display_name": "GPT-5.1 Codex mini", + "id": "Qwen/Qwen2.5-VL-7B-Instruct", + "name": "Qwen/Qwen2.5-VL-7B-Instruct", + "display_name": "Qwen/Qwen2.5-VL-7B-Instruct", "modalities": { "input": [ "text", @@ -42711,31 +40930,27 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 33000, + "output": 4000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "release_date": "2025-01-28", + "last_updated": "2025-11-25", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.025 - }, - "type": "chat" + "input": 0.05, + "output": 0.05 + } }, { - "id": "o3-mini", - "name": "o3-mini", - "display_name": "o3-mini", + "id": "Qwen/Qwen3-32B", + "name": "Qwen/Qwen3-32B", + "display_name": "Qwen/Qwen3-32B", "modalities": { "input": [ "text" @@ -42745,31 +40960,27 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 131000, + "output": 131000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2024-05", - "release_date": "2024-12-20", - "last_updated": "2025-01-29", + "release_date": "2025-04-30", + "last_updated": "2025-11-25", "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.55 - }, - "type": "chat" + "input": 0.14, + "output": 0.57 + } }, { - "id": "gpt-5.2-chat-latest", - "name": "GPT-5.2 Chat", - "display_name": "GPT-5.2 Chat", + "id": "Qwen/Qwen3-VL-8B-Instruct", + "name": "Qwen/Qwen3-VL-8B-Instruct", + "display_name": "Qwen/Qwen3-VL-8B-Instruct", "modalities": { "input": [ "text", @@ -42780,31 +40991,27 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 262000, + "output": 262000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "release_date": "2025-10-15", + "last_updated": "2025-11-25", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 - }, - "type": "chat" + "input": 0.18, + "output": 0.68 + } }, { - "id": "gpt-5.1", - "name": "GPT-5.1", - "display_name": "GPT-5.1", + "id": "Qwen/Qwen3-VL-235B-A22B-Instruct", + "name": "Qwen/Qwen3-VL-235B-A22B-Instruct", + "display_name": "Qwen/Qwen3-VL-235B-A22B-Instruct", "modalities": { "input": [ "text", @@ -42815,31 +41022,27 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 262000, + "output": 262000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "release_date": "2025-10-04", + "last_updated": "2025-11-25", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.13 - }, - "type": "chat" + "input": 0.3, + "output": 1.5 + } }, { - "id": "codex-mini-latest", - "name": "Codex Mini", - "display_name": "Codex Mini", + "id": "Qwen/Qwen3-Coder-480B-A35B-Instruct", + "name": "Qwen/Qwen3-Coder-480B-A35B-Instruct", + "display_name": "Qwen/Qwen3-Coder-480B-A35B-Instruct", "modalities": { "input": [ "text" @@ -42849,31 +41052,27 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 262000, + "output": 262000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-05-16", - "last_updated": "2025-05-16", + "release_date": "2025-07-31", + "last_updated": "2025-11-25", "cost": { - "input": 1.5, - "output": 6, - "cache_read": 0.375 - }, - "type": "chat" + "input": 0.25, + "output": 1 + } }, { - "id": "gpt-5-nano", - "name": "GPT-5 Nano", - "display_name": "GPT-5 Nano", + "id": "Qwen/Qwen3-VL-235B-A22B-Thinking", + "name": "Qwen/Qwen3-VL-235B-A22B-Thinking", + "display_name": "Qwen/Qwen3-VL-235B-A22B-Thinking", "modalities": { "input": [ "text", @@ -42884,10 +41083,10 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 262000, + "output": 262000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -42895,55 +41094,47 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "release_date": "2025-10-04", + "last_updated": "2025-11-25", "cost": { - "input": 0.05, - "output": 0.4, - "cache_read": 0.01 - }, - "type": "chat" + "input": 0.45, + "output": 3.5 + } }, { - "id": "gpt-5-codex", - "name": "GPT-5-Codex", - "display_name": "GPT-5-Codex", + "id": "Qwen/Qwen3-30B-A3B-Instruct-2507", + "name": "Qwen/Qwen3-30B-A3B-Instruct-2507", + "display_name": "Qwen/Qwen3-30B-A3B-Instruct-2507", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 262000, + "output": 262000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-09-15", - "last_updated": "2025-09-15", + "release_date": "2025-07-30", + "last_updated": "2025-11-25", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 - }, - "type": "chat" + "input": 0.09, + "output": 0.3 + } }, { - "id": "gpt-4o", - "name": "GPT-4o", - "display_name": "GPT-4o", + "id": "Qwen/Qwen3-VL-30B-A3B-Thinking", + "name": "Qwen/Qwen3-VL-30B-A3B-Thinking", + "display_name": "Qwen/Qwen3-VL-30B-A3B-Thinking", "modalities": { "input": [ "text", @@ -42954,30 +41145,28 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-05-13", - "last_updated": "2024-08-06", + "release_date": "2025-10-11", + "last_updated": "2025-11-25", "cost": { - "input": 2.5, - "output": 10, - "cache_read": 1.25 - }, - "type": "chat" + "input": 0.29, + "output": 1 + } }, { - "id": "gpt-4.1", - "name": "GPT-4.1", - "display_name": "GPT-4.1", + "id": "Qwen/Qwen3-VL-32B-Thinking", + "name": "Qwen/Qwen3-VL-32B-Thinking", + "display_name": "Qwen/Qwen3-VL-32B-Thinking", "modalities": { "input": [ "text", @@ -42988,79 +41177,74 @@ ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "release_date": "2025-10-21", + "last_updated": "2025-11-25", "cost": { - "input": 2, - "output": 8, - "cache_read": 0.5 - }, - "type": "chat" + "input": 0.2, + "output": 1.5 + } }, { - "id": "o4-mini", - "name": "o4-mini", - "display_name": "o4-mini", + "id": "Qwen/Qwen3-235B-A22B-Thinking-2507", + "name": "Qwen/Qwen3-235B-A22B-Thinking-2507", + "display_name": "Qwen/Qwen3-235B-A22B-Thinking-2507", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 262000, + "output": 262000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-05", - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "release_date": "2025-07-28", + "last_updated": "2025-11-25", "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.28 - }, - "type": "chat" + "input": 0.13, + "output": 0.6 + } }, { - "id": "o1", - "name": "o1", - "display_name": "o1", + "id": "Qwen/Qwen3-Omni-30B-A3B-Thinking", + "name": "Qwen/Qwen3-Omni-30B-A3B-Thinking", + "display_name": "Qwen/Qwen3-Omni-30B-A3B-Thinking", "modalities": { "input": [ "text", - "image" + "image", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 66000, + "output": 66000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -43068,20 +41252,17 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-12-05", - "last_updated": "2024-12-05", + "release_date": "2025-10-04", + "last_updated": "2025-11-25", "cost": { - "input": 15, - "output": 60, - "cache_read": 7.5 - }, - "type": "chat" + "input": 0.1, + "output": 0.4 + } }, { - "id": "gpt-5-mini", - "name": "GPT-5 Mini", - "display_name": "GPT-5 Mini", + "id": "Qwen/Qwen3-VL-32B-Instruct", + "name": "Qwen/Qwen3-VL-32B-Instruct", + "display_name": "Qwen/Qwen3-VL-32B-Instruct", "modalities": { "input": [ "text", @@ -43092,31 +41273,27 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 262000, + "output": 262000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "release_date": "2025-10-21", + "last_updated": "2025-11-25", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.03 - }, - "type": "chat" + "input": 0.2, + "output": 0.6 + } }, { - "id": "o1-mini", - "name": "o1-mini", - "display_name": "o1-mini", + "id": "Qwen/Qwen3-Next-80B-A3B-Instruct", + "name": "Qwen/Qwen3-Next-80B-A3B-Instruct", + "display_name": "Qwen/Qwen3-Next-80B-A3B-Instruct", "modalities": { "input": [ "text" @@ -43126,31 +41303,27 @@ ] }, "limit": { - "context": 128000, - "output": 65536 + "context": 262000, + "output": 262000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-09-12", - "last_updated": "2024-09-12", + "release_date": "2025-09-18", + "last_updated": "2025-11-25", "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.55 - }, - "type": "chat" + "input": 0.14, + "output": 1.4 + } }, { - "id": "text-embedding-ada-002", - "name": "text-embedding-ada-002", - "display_name": "text-embedding-ada-002", + "id": "Qwen/Qwen2.5-14B-Instruct", + "name": "Qwen/Qwen2.5-14B-Instruct", + "display_name": "Qwen/Qwen2.5-14B-Instruct", "modalities": { "input": [ "text" @@ -43160,63 +41333,58 @@ ] }, "limit": { - "context": 8192, - "output": 1536 + "context": 33000, + "output": 4000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2022-12", - "release_date": "2022-12-15", - "last_updated": "2022-12-15", + "release_date": "2024-09-18", + "last_updated": "2025-11-25", "cost": { "input": 0.1, - "output": 0 - }, - "type": "embedding" + "output": 0.1 + } }, { - "id": "o3-pro", - "name": "o3-pro", - "display_name": "o3-pro", + "id": "Qwen/Qwen3-Next-80B-A3B-Thinking", + "name": "Qwen/Qwen3-Next-80B-A3B-Thinking", + "display_name": "Qwen/Qwen3-Next-80B-A3B-Thinking", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 262000, + "output": 262000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-05", - "release_date": "2025-06-10", - "last_updated": "2025-06-10", + "release_date": "2025-09-25", + "last_updated": "2025-11-25", "cost": { - "input": 20, - "output": 80 - }, - "type": "chat" + "input": 0.14, + "output": 0.57 + } }, { - "id": "gpt-4o-2024-11-20", - "name": "GPT-4o (2024-11-20)", - "display_name": "GPT-4o (2024-11-20)", + "id": "zai-org/GLM-4.6V", + "name": "zai-org/GLM-4.6V", + "display_name": "zai-org/GLM-4.6V", "modalities": { "input": [ "text", @@ -43227,135 +41395,119 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 131000, + "output": 131000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-11-20", - "last_updated": "2024-11-20", + "release_date": "2025-12-07", + "last_updated": "2025-12-07", "cost": { - "input": 2.5, - "output": 10, - "cache_read": 1.25 - }, - "type": "chat" + "input": 0.3, + "output": 0.9 + } }, { - "id": "gpt-5.1-codex-max", - "name": "GPT-5.1 Codex Max", - "display_name": "GPT-5.1 Codex Max", + "id": "zai-org/GLM-4.5", + "name": "zai-org/GLM-4.5", + "display_name": "zai-org/GLM-4.5", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 131000, + "output": 131000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "release_date": "2025-07-28", + "last_updated": "2025-11-25", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 - }, - "type": "chat" + "input": 0.4, + "output": 2 + } }, { - "id": "o3", - "name": "o3", - "display_name": "o3", + "id": "zai-org/GLM-4.7", + "name": "zai-org/GLM-4.7", + "display_name": "zai-org/GLM-4.7", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 205000, + "output": 205000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-05", - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "cost": { - "input": 2, - "output": 8, - "cache_read": 0.5 - }, - "type": "chat" + "input": 0.6, + "output": 2.2 + } }, { - "id": "o4-mini-deep-research", - "name": "o4-mini-deep-research", - "display_name": "o4-mini-deep-research", + "id": "zai-org/GLM-4.6", + "name": "zai-org/GLM-4.6", + "display_name": "zai-org/GLM-4.6", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 205000, + "output": 205000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-05", - "release_date": "2024-06-26", - "last_updated": "2024-06-26", + "release_date": "2025-10-04", + "last_updated": "2025-11-25", "cost": { - "input": 2, - "output": 8, - "cache_read": 0.5 - }, - "type": "chat" + "input": 0.5, + "output": 1.9 + } }, { - "id": "gpt-5-chat-latest", - "name": "GPT-5 Chat (latest)", - "display_name": "GPT-5 Chat (latest)", + "id": "zai-org/GLM-4.5V", + "name": "zai-org/GLM-4.5V", + "display_name": "zai-org/GLM-4.5V", "modalities": { "input": [ "text", @@ -43366,133 +41518,119 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 66000, + "output": 66000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "release_date": "2025-08-13", + "last_updated": "2025-11-25", "cost": { - "input": 1.25, - "output": 10 - }, - "type": "chat" + "input": 0.14, + "output": 0.86 + } }, { - "id": "gpt-4o-mini", - "name": "GPT-4o mini", - "display_name": "GPT-4o mini", + "id": "zai-org/GLM-4.5-Air", + "name": "zai-org/GLM-4.5-Air", + "display_name": "zai-org/GLM-4.5-Air", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 131000, + "output": 131000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-07-18", - "last_updated": "2024-07-18", + "release_date": "2025-07-28", + "last_updated": "2025-11-25", "cost": { - "input": 0.15, - "output": 0.6, - "cache_read": 0.08 - }, - "type": "chat" + "input": 0.14, + "output": 0.86 + } }, { - "id": "gpt-5", - "name": "GPT-5", - "display_name": "GPT-5", + "id": "deepseek-ai/DeepSeek-R1", + "name": "deepseek-ai/DeepSeek-R1", + "display_name": "deepseek-ai/DeepSeek-R1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 164000, + "output": 164000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "release_date": "2025-05-28", + "last_updated": "2025-11-25", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.13 - }, - "type": "chat" + "input": 0.5, + "output": 2.18 + } }, { - "id": "gpt-5-pro", - "name": "GPT-5 Pro", - "display_name": "GPT-5 Pro", + "id": "deepseek-ai/DeepSeek-R1-Distill-Qwen-32B", + "name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-32B", + "display_name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-32B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 272000 + "context": 131000, + "output": 131000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-10-06", - "last_updated": "2025-10-06", + "release_date": "2025-01-20", + "last_updated": "2025-11-25", "cost": { - "input": 15, - "output": 120 - }, - "type": "chat" + "input": 0.18, + "output": 0.18 + } }, { - "id": "gpt-5.2", - "name": "GPT-5.2", - "display_name": "GPT-5.2", + "id": "deepseek-ai/deepseek-vl2", + "name": "deepseek-ai/deepseek-vl2", + "display_name": "deepseek-ai/deepseek-vl2", "modalities": { "input": [ "text", @@ -43503,88 +41641,69 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 4000, + "output": 4000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "release_date": "2024-12-13", + "last_updated": "2025-11-25", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 - }, - "type": "chat" + "input": 0.15, + "output": 0.15 + } }, { - "id": "gpt-5.1-chat-latest", - "name": "GPT-5.1 Chat", - "display_name": "GPT-5.1 Chat", + "id": "deepseek-ai/DeepSeek-R1-Distill-Qwen-14B", + "name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-14B", + "display_name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-14B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 131000, + "output": 131000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "release_date": "2025-01-20", + "last_updated": "2025-11-25", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 - }, - "type": "chat" - } - ] - }, - "zhipuai-coding-plan": { - "id": "zhipuai-coding-plan", - "name": "Zhipu AI Coding Plan", - "display_name": "Zhipu AI Coding Plan", - "api": "https://open.bigmodel.cn/api/coding/paas/v4", - "doc": "https://docs.bigmodel.cn/cn/coding-plan/overview", - "models": [ + "input": 0.1, + "output": 0.1 + } + }, { - "id": "glm-4.6v-flash", - "name": "GLM-4.6V-Flash", - "display_name": "GLM-4.6V-Flash", + "id": "deepseek-ai/DeepSeek-V3.2-Exp", + "name": "deepseek-ai/DeepSeek-V3.2-Exp", + "display_name": "deepseek-ai/DeepSeek-V3.2-Exp", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 164000, + "output": 164000 }, "temperature": true, "tool_call": true, @@ -43592,34 +41711,30 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-08", - "last_updated": "2025-12-08", + "attachment": false, + "open_weights": false, + "release_date": "2025-10-10", + "last_updated": "2025-11-25", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.27, + "output": 0.41 + } }, { - "id": "glm-4.6v", - "name": "GLM-4.6V", - "display_name": "GLM-4.6V", + "id": "deepseek-ai/DeepSeek-V3.1-Terminus", + "name": "deepseek-ai/DeepSeek-V3.1-Terminus", + "display_name": "deepseek-ai/DeepSeek-V3.1-Terminus", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 164000, + "output": 164000 }, "temperature": true, "tool_call": true, @@ -43627,21 +41742,19 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-08", - "last_updated": "2025-12-08", + "attachment": false, + "open_weights": false, + "release_date": "2025-09-29", + "last_updated": "2025-11-25", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.27, + "output": 1 + } }, { - "id": "glm-4.6", - "name": "GLM-4.6", - "display_name": "GLM-4.6", + "id": "deepseek-ai/DeepSeek-R1-Distill-Qwen-7B", + "name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-7B", + "display_name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-7B", "modalities": { "input": [ "text" @@ -43651,8 +41764,8 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 33000, + "output": 16000 }, "temperature": true, "tool_call": true, @@ -43661,35 +41774,29 @@ "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-09-30", - "last_updated": "2025-09-30", + "open_weights": false, + "release_date": "2025-01-20", + "last_updated": "2025-11-25", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 - }, - "type": "chat" + "input": 0.05, + "output": 0.05 + } }, { - "id": "glm-4.5v", - "name": "GLM-4.5V", - "display_name": "GLM-4.5V", + "id": "deepseek-ai/DeepSeek-V3.2", + "name": "deepseek-ai/DeepSeek-V3.2", + "display_name": "deepseek-ai/DeepSeek-V3.2", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 64000, - "output": 16384 + "context": 164000, + "output": 164000 }, "temperature": true, "tool_call": true, @@ -43697,21 +41804,19 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-08-11", - "last_updated": "2025-08-11", + "attachment": false, + "open_weights": false, + "release_date": "2025-12-03", + "last_updated": "2025-12-03", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.27, + "output": 0.42 + } }, { - "id": "glm-4.5-air", - "name": "GLM-4.5-Air", - "display_name": "GLM-4.5-Air", + "id": "deepseek-ai/DeepSeek-V3", + "name": "deepseek-ai/DeepSeek-V3", + "display_name": "deepseek-ai/DeepSeek-V3", "modalities": { "input": [ "text" @@ -43721,32 +41826,27 @@ ] }, "limit": { - "context": 131072, - "output": 98304 + "context": 164000, + "output": 164000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "open_weights": false, + "release_date": "2024-12-26", + "last_updated": "2025-11-25", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 - }, - "type": "chat" + "input": 0.25, + "output": 1 + } }, { - "id": "glm-4.5", - "name": "GLM-4.5", - "display_name": "GLM-4.5", + "id": "deepseek-ai/DeepSeek-V3.1", + "name": "deepseek-ai/DeepSeek-V3.1", + "display_name": "deepseek-ai/DeepSeek-V3.1", "modalities": { "input": [ "text" @@ -43756,8 +41856,8 @@ ] }, "limit": { - "context": 131072, - "output": 98304 + "context": 164000, + "output": 164000 }, "temperature": true, "tool_call": true, @@ -43766,133 +41866,128 @@ "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "open_weights": false, + "release_date": "2025-08-25", + "last_updated": "2025-11-25", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 - }, - "type": "chat" - }, + "input": 0.27, + "output": 1 + } + } + ] + }, + "helicone": { + "id": "helicone", + "name": "Helicone", + "display_name": "Helicone", + "api": "https://ai-gateway.helicone.ai/v1", + "doc": "https://helicone.ai/models", + "models": [ { - "id": "glm-4.5-flash", - "name": "GLM-4.5-Flash", - "display_name": "GLM-4.5-Flash", + "id": "gpt-4.1-nano", + "name": "OpenAI GPT-4.1 Nano", + "display_name": "OpenAI GPT-4.1 Nano", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 98304 + "context": 1047576, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, + "open_weights": false, "knowledge": "2025-04", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 - }, - "type": "chat" + "input": 0.09999999999999999, + "output": 0.39999999999999997, + "cache_read": 0.024999999999999998 + } }, { - "id": "glm-4.7", - "name": "GLM-4.7", - "display_name": "GLM-4.7", + "id": "grok-4-fast-non-reasoning", + "name": "xAI Grok 4 Fast Non-Reasoning", + "display_name": "xAI Grok 4 Fast Non-Reasoning", "modalities": { "input": [ - "text" + "text", + "image", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 2000000, + "output": 2000000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-22", - "last_updated": "2025-12-22", + "open_weights": false, + "knowledge": "2025-09", + "release_date": "2025-09-19", + "last_updated": "2025-09-19", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 - }, - "type": "chat" - } - ] - }, - "minimax-cn": { - "id": "minimax-cn", - "name": "MiniMax (China)", - "display_name": "MiniMax (China)", - "api": "https://api.minimaxi.com/anthropic/v1", - "doc": "https://platform.minimaxi.com/docs/guides/quickstart", - "models": [ + "input": 0.19999999999999998, + "output": 0.5, + "cache_read": 0.049999999999999996 + } + }, { - "id": "MiniMax-M2.1", - "name": "MiniMax-M2.1", - "display_name": "MiniMax-M2.1", + "id": "qwen3-coder", + "name": "Qwen3 Coder 480B A35B Instruct Turbo", + "display_name": "Qwen3 Coder 480B A35B Instruct Turbo", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 262144, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-12-23", - "last_updated": "2025-12-23", + "open_weights": false, + "knowledge": "2025-07", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", "cost": { - "input": 0.3, - "output": 1.2 - }, - "type": "chat" + "input": 0.22, + "output": 0.95 + } }, { - "id": "MiniMax-M2", - "name": "MiniMax-M2", - "display_name": "MiniMax-M2", + "id": "deepseek-v3", + "name": "DeepSeek V3", + "display_name": "DeepSeek V3", "modalities": { "input": [ "text" @@ -43902,69 +41997,64 @@ ] }, "limit": { - "context": 196608, - "output": 128000 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-10-27", - "last_updated": "2025-10-27", + "open_weights": false, + "knowledge": "2024-12", + "release_date": "2024-12-26", + "last_updated": "2024-12-26", "cost": { - "input": 0.3, - "output": 1.2 - }, - "type": "chat" - } - ] - }, - "perplexity": { - "id": "perplexity", - "name": "Perplexity", - "display_name": "Perplexity", - "doc": "https://docs.perplexity.ai", - "models": [ + "input": 0.56, + "output": 1.68, + "cache_read": 0.07 + } + }, { - "id": "sonar", - "name": "Sonar", - "display_name": "Sonar", + "id": "claude-opus-4", + "name": "Anthropic: Claude Opus 4", + "display_name": "Anthropic: Claude Opus 4", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 200000, + "output": 32000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "knowledge": "2025-09-01", - "release_date": "2024-01-01", - "last_updated": "2025-09-01", + "knowledge": "2025-05", + "release_date": "2025-05-14", + "last_updated": "2025-05-14", "cost": { - "input": 1, - "output": 1 - }, - "type": "chat" + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 + } }, { - "id": "sonar-pro", - "name": "Sonar Pro", - "display_name": "Sonar Pro", + "id": "grok-4-fast-reasoning", + "name": "xAI: Grok 4 Fast Reasoning", + "display_name": "xAI: Grok 4 Fast Reasoning", "modalities": { "input": [ "text", @@ -43975,103 +42065,96 @@ ] }, "limit": { - "context": 200000, - "output": 8192 + "context": 2000000, + "output": 2000000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-09-01", - "release_date": "2024-01-01", + "knowledge": "2025-09", + "release_date": "2025-09-01", "last_updated": "2025-09-01", "cost": { - "input": 3, - "output": 15 - }, - "type": "chat" + "input": 0.19999999999999998, + "output": 0.5, + "cache_read": 0.049999999999999996 + } }, { - "id": "sonar-reasoning-pro", - "name": "Sonar Reasoning Pro", - "display_name": "Sonar Reasoning Pro", + "id": "llama-3.1-8b-instant", + "name": "Meta Llama 3.1 8B Instant", + "display_name": "Meta Llama 3.1 8B Instant", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 131072, + "output": 32678 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-09-01", - "release_date": "2024-01-01", - "last_updated": "2025-09-01", + "knowledge": "2024-07", + "release_date": "2024-07-01", + "last_updated": "2024-07-01", "cost": { - "input": 2, - "output": 8 - }, - "type": "chat" - } - ] - }, - "ovhcloud": { - "id": "ovhcloud", - "name": "OVHcloud AI Endpoints", - "display_name": "OVHcloud AI Endpoints", - "api": "https://oai.endpoints.kepler.ai.cloud.ovh.net/v1", - "doc": "https://www.ovhcloud.com/en/public-cloud/ai-endpoints/catalog//", - "models": [ + "input": 0.049999999999999996, + "output": 0.08 + } + }, { - "id": "mixtral-8x7b-instruct-v0.1", - "name": "Mixtral-8x7B-Instruct-v0.1", - "display_name": "Mixtral-8x7B-Instruct-v0.1", + "id": "claude-opus-4-1", + "name": "Anthropic: Claude Opus 4.1", + "display_name": "Anthropic: Claude Opus 4.1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32000, + "context": 200000, "output": 32000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": true, - "release_date": "2025-04-01", - "last_updated": "2025-04-01", + "open_weights": false, + "knowledge": "2025-08", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.7, - "output": 0.7 - }, - "type": "chat" + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 + } }, { - "id": "mistral-7b-instruct-v0.3", - "name": "Mistral-7B-Instruct-v0.3", - "display_name": "Mistral-7B-Instruct-v0.3", + "id": "grok-4", + "name": "xAI Grok 4", + "display_name": "xAI Grok 4", "modalities": { "input": [ "text" @@ -44081,8 +42164,8 @@ ] }, "limit": { - "context": 127000, - "output": 127000 + "context": 256000, + "output": 256000 }, "temperature": true, "tool_call": true, @@ -44090,30 +42173,33 @@ "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-04-01", - "last_updated": "2025-04-01", + "open_weights": false, + "knowledge": "2024-07", + "release_date": "2024-07-09", + "last_updated": "2024-07-09", "cost": { - "input": 0.11, - "output": 0.11 - }, - "type": "chat" + "input": 3, + "output": 15, + "cache_read": 0.75 + } }, { - "id": "llama-3.1-8b-instruct", - "name": "Llama-3.1-8B-Instruct", - "display_name": "Llama-3.1-8B-Instruct", + "id": "qwen3-next-80b-a3b-instruct", + "name": "Qwen3 Next 80B A3B Instruct", + "display_name": "Qwen3 Next 80B A3B Instruct", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 262000, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -44121,19 +42207,19 @@ "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-06-11", - "last_updated": "2025-06-11", + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.11, - "output": 0.11 - }, - "type": "chat" + "input": 0.14, + "output": 1.4 + } }, { - "id": "qwen2.5-vl-72b-instruct", - "name": "Qwen2.5-VL-72B-Instruct", - "display_name": "Qwen2.5-VL-72B-Instruct", + "id": "llama-4-maverick", + "name": "Meta Llama 4 Maverick 17B 128E", + "display_name": "Meta Llama 4 Maverick 17B 128E", "modalities": { "input": [ "text", @@ -44144,28 +42230,28 @@ ] }, "limit": { - "context": 32000, - "output": 32000 + "context": 131072, + "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": true, - "release_date": "2025-03-31", - "last_updated": "2025-03-31", + "attachment": false, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 1.01, - "output": 1.01 - }, - "type": "chat" + "input": 0.15, + "output": 0.6 + } }, { - "id": "mistral-nemo-instruct-2407", - "name": "Mistral-Nemo-Instruct-2407", - "display_name": "Mistral-Nemo-Instruct-2407", + "id": "llama-prompt-guard-2-86m", + "name": "Meta Llama Prompt Guard 2 86M", + "display_name": "Meta Llama Prompt Guard 2 86M", "modalities": { "input": [ "text" @@ -44175,28 +42261,28 @@ ] }, "limit": { - "context": 118000, - "output": 118000 + "context": 512, + "output": 2 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2024-11-20", - "last_updated": "2024-11-20", + "open_weights": false, + "knowledge": "2024-10", + "release_date": "2024-10-01", + "last_updated": "2024-10-01", "cost": { - "input": 0.14, - "output": 0.14 - }, - "type": "chat" + "input": 0.01, + "output": 0.01 + } }, { - "id": "mistral-small-3.2-24b-instruct-2506", - "name": "Mistral-Small-3.2-24B-Instruct-2506", - "display_name": "Mistral-Small-3.2-24B-Instruct-2506", + "id": "grok-4-1-fast-reasoning", + "name": "xAI Grok 4.1 Fast Reasoning", + "display_name": "xAI Grok 4.1 Fast Reasoning", "modalities": { "input": [ "text", @@ -44207,28 +42293,30 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 2000000, + "output": 2000000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": true, - "release_date": "2025-07-16", - "last_updated": "2025-07-16", + "attachment": false, + "open_weights": false, + "knowledge": "2025-11", + "release_date": "2025-11-17", + "last_updated": "2025-11-17", "cost": { - "input": 0.1, - "output": 0.31 - }, - "type": "chat" + "input": 0.19999999999999998, + "output": 0.5, + "cache_read": 0.049999999999999996 + } }, { - "id": "qwen2.5-coder-32b-instruct", - "name": "Qwen2.5-Coder-32B-Instruct", - "display_name": "Qwen2.5-Coder-32B-Instruct", + "id": "grok-code-fast-1", + "name": "xAI Grok Code Fast 1", + "display_name": "xAI Grok Code Fast 1", "modalities": { "input": [ "text" @@ -44238,39 +42326,41 @@ ] }, "limit": { - "context": 32000, - "output": 32000 + "context": 256000, + "output": 10000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-03-24", - "last_updated": "2025-03-24", + "open_weights": false, + "knowledge": "2024-08", + "release_date": "2024-08-25", + "last_updated": "2024-08-25", "cost": { - "input": 0.96, - "output": 0.96 - }, - "type": "chat" + "input": 0.19999999999999998, + "output": 1.5, + "cache_read": 0.02 + } }, { - "id": "qwen3-coder-30b-a3b-instruct", - "name": "Qwen3-Coder-30B-A3B-Instruct", - "display_name": "Qwen3-Coder-30B-A3B-Instruct", + "id": "claude-4.5-haiku", + "name": "Anthropic: Claude 4.5 Haiku", + "display_name": "Anthropic: Claude 4.5 Haiku", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 200000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -44278,176 +42368,151 @@ "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-10-28", - "last_updated": "2025-10-28", + "open_weights": false, + "knowledge": "2025-10", + "release_date": "2025-10-01", + "last_updated": "2025-10-01", "cost": { - "input": 0.07, - "output": 0.26 - }, - "type": "chat" + "input": 1, + "output": 5, + "cache_read": 0.09999999999999999, + "cache_write": 1.25 + } }, { - "id": "llava-next-mistral-7b", - "name": "llava-next-mistral-7b", - "display_name": "llava-next-mistral-7b", + "id": "llama-3.1-8b-instruct-turbo", + "name": "Meta Llama 3.1 8B Instruct Turbo", + "display_name": "Meta Llama 3.1 8B Instruct Turbo", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 32000, - "output": 32000 + "context": 128000, + "output": 128000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": true, - "release_date": "2025-01-08", - "last_updated": "2025-01-08", + "attachment": false, + "open_weights": false, + "knowledge": "2024-07", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 0.32, - "output": 0.32 - }, - "type": "chat" + "input": 0.02, + "output": 0.03 + } }, { - "id": "deepseek-r1-distill-llama-70b", - "name": "DeepSeek-R1-Distill-Llama-70B", - "display_name": "DeepSeek-R1-Distill-Llama-70B", + "id": "gpt-5.1-codex", + "name": "OpenAI: GPT-5.1 Codex", + "display_name": "OpenAI: GPT-5.1 Codex", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "text" + "text", + "image" ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-01-30", - "last_updated": "2025-01-30", + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.74, - "output": 0.74 - }, - "type": "chat" + "input": 1.25, + "output": 10, + "cache_read": 0.12500000000000003 + } }, { - "id": "meta-llama-3_1-70b-instruct", - "name": "Meta-Llama-3_1-70B-Instruct", - "display_name": "Meta-Llama-3_1-70B-Instruct", + "id": "gpt-4.1-mini-2025-04-14", + "name": "OpenAI GPT-4.1 Mini", + "display_name": "OpenAI GPT-4.1 Mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 1047576, + "output": 32768 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-04-01", - "last_updated": "2025-04-01", - "cost": { - "input": 0.74, - "output": 0.74 - }, - "type": "chat" - }, - { - "id": "gpt-oss-20b", - "name": "gpt-oss-20b", - "display_name": "gpt-oss-20b", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 131000, - "output": 131000 - }, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "attachment": false, - "open_weights": true, - "release_date": "2025-08-28", - "last_updated": "2025-08-28", + "open_weights": false, + "knowledge": "2025-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.05, - "output": 0.18 - }, - "type": "chat" + "input": 0.39999999999999997, + "output": 1.5999999999999999, + "cache_read": 0.09999999999999999 + } }, { - "id": "gpt-oss-120b", - "name": "gpt-oss-120b", - "display_name": "gpt-oss-120b", + "id": "llama-guard-4", + "name": "Meta Llama Guard 4 12B", + "display_name": "Meta Llama Guard 4 12B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 131072, + "output": 1024 }, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-08-28", - "last_updated": "2025-08-28", + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.09, - "output": 0.47 - }, - "type": "chat" + "input": 0.21, + "output": 0.21 + } }, { - "id": "meta-llama-3_3-70b-instruct", - "name": "Meta-Llama-3_3-70B-Instruct", - "display_name": "Meta-Llama-3_3-70B-Instruct", + "id": "llama-3.1-8b-instruct", + "name": "Meta Llama 3.1 8B Instruct", + "display_name": "Meta Llama 3.1 8B Instruct", "modalities": { "input": [ "text" @@ -44457,8 +42522,8 @@ ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 16384, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -44466,30 +42531,33 @@ "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-04-01", - "last_updated": "2025-04-01", + "open_weights": false, + "knowledge": "2024-07", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 0.74, - "output": 0.74 - }, - "type": "chat" + "input": 0.02, + "output": 0.049999999999999996 + } }, { - "id": "qwen3-32b", - "name": "Qwen3-32B", - "display_name": "Qwen3-32B", + "id": "gemini-3-pro-preview", + "name": "Google Gemini 3 Pro Preview", + "display_name": "Google Gemini 3 Pro Preview", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video" ], "output": [ "text" ] }, "limit": { - "context": 32000, - "output": 32000 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -44498,27 +42566,20 @@ "default": true }, "attachment": false, - "open_weights": true, - "release_date": "2025-07-16", - "last_updated": "2025-07-16", + "open_weights": false, + "knowledge": "2025-11", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", "cost": { - "input": 0.09, - "output": 0.25 - }, - "type": "chat" - } - ] - }, - "v0": { - "id": "v0", - "name": "v0", - "display_name": "v0", - "doc": "https://sdk.vercel.ai/providers/ai-sdk-providers/vercel", - "models": [ + "input": 2, + "output": 12, + "cache_read": 0.19999999999999998 + } + }, { - "id": "v0-1.5-lg", - "name": "v0-1.5-lg", - "display_name": "v0-1.5-lg", + "id": "gemini-2.5-flash", + "name": "Google Gemini 2.5 Flash", + "display_name": "Google Gemini 2.5 Flash", "modalities": { "input": [ "text", @@ -44529,8 +42590,8 @@ ] }, "limit": { - "context": 512000, - "output": 32000 + "context": 1048576, + "output": 65535 }, "temperature": true, "tool_call": true, @@ -44538,20 +42599,22 @@ "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-06-09", - "last_updated": "2025-06-09", + "knowledge": "2025-06", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", "cost": { - "input": 15, - "output": 75 - }, - "type": "chat" + "input": 0.3, + "output": 2.5, + "cache_read": 0.075, + "cache_write": 0.3 + } }, { - "id": "v0-1.5-md", - "name": "v0-1.5-md", - "display_name": "v0-1.5-md", + "id": "gpt-4.1-mini", + "name": "OpenAI GPT-4.1 Mini", + "display_name": "OpenAI GPT-4.1 Mini", "modalities": { "input": [ "text", @@ -44562,33 +42625,32 @@ ] }, "limit": { - "context": 128000, - "output": 32000 + "context": 1047576, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-06-09", - "last_updated": "2025-06-09", + "knowledge": "2025-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 3, - "output": 15 - }, - "type": "chat" + "input": 0.39999999999999997, + "output": 1.5999999999999999, + "cache_read": 0.09999999999999999 + } }, { - "id": "v0-1.0-md", - "name": "v0-1.0-md", - "display_name": "v0-1.0-md", + "id": "deepseek-v3.1-terminus", + "name": "DeepSeek V3.1 Terminus", + "display_name": "DeepSeek V3.1 Terminus", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -44596,7 +42658,7 @@ }, "limit": { "context": 128000, - "output": 32000 + "output": 16384 }, "temperature": true, "tool_call": true, @@ -44604,29 +42666,21 @@ "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "knowledge": "2025-09", + "release_date": "2025-09-22", + "last_updated": "2025-09-22", "cost": { - "input": 3, - "output": 15 - }, - "type": "chat" - } - ] - }, - "iflowcn": { - "id": "iflowcn", - "name": "iFlow", - "display_name": "iFlow", - "api": "https://apis.iflow.cn/v1", - "doc": "https://platform.iflow.cn/en/docs", - "models": [ + "input": 0.27, + "output": 1, + "cache_read": 0.21600000000000003 + } + }, { - "id": "qwen3-coder", - "name": "Qwen3-Coder-480B-A35B", - "display_name": "Qwen3-Coder-480B-A35B", + "id": "llama-prompt-guard-2-22m", + "name": "Meta Llama Prompt Guard 2 22M", + "display_name": "Meta Llama Prompt Guard 2 22M", "modalities": { "input": [ "text" @@ -44636,40 +42690,40 @@ ] }, "limit": { - "context": 256000, - "output": 64000 + "context": 512, + "output": 2 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-01", - "last_updated": "2025-07-01", + "open_weights": false, + "knowledge": "2024-10", + "release_date": "2024-10-01", + "last_updated": "2024-10-01", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.01, + "output": 0.01 + } }, { - "id": "deepseek-v3", - "name": "DeepSeek-V3", - "display_name": "DeepSeek-V3", + "id": "claude-3.5-sonnet-v2", + "name": "Anthropic: Claude 3.5 Sonnet v2", + "display_name": "Anthropic: Claude 3.5 Sonnet v2", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32000 + "context": 200000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -44677,20 +42731,21 @@ "supported": false }, "attachment": false, - "open_weights": true, + "open_weights": false, "knowledge": "2024-10", - "release_date": "2024-12-26", - "last_updated": "2024-12-26", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 3, + "output": 15, + "cache_read": 0.30000000000000004, + "cache_write": 3.75 + } }, { - "id": "kimi-k2", - "name": "Kimi-K2", - "display_name": "Kimi-K2", + "id": "sonar-deep-research", + "name": "Perplexity Sonar Deep Research", + "display_name": "Perplexity Sonar Deep Research", "modalities": { "input": [ "text" @@ -44700,40 +42755,41 @@ ] }, "limit": { - "context": 128000, - "output": 64000 + "context": 127000, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "knowledge": "2025-01", + "release_date": "2025-01-27", + "last_updated": "2025-01-27", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 2, + "output": 8 + } }, { - "id": "deepseek-r1", - "name": "DeepSeek-R1", - "display_name": "DeepSeek-R1", + "id": "gemini-2.5-flash-lite", + "name": "Google Gemini 2.5 Flash Lite", + "display_name": "Google Gemini 2.5 Flash Lite", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32000 + "context": 1048576, + "output": 65535 }, "temperature": true, "tool_call": true, @@ -44742,30 +42798,32 @@ "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-01-20", - "last_updated": "2025-01-20", + "open_weights": false, + "knowledge": "2025-07", + "release_date": "2025-07-22", + "last_updated": "2025-07-22", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.09999999999999999, + "output": 0.39999999999999997, + "cache_read": 0.024999999999999998, + "cache_write": 0.09999999999999999 + } }, { - "id": "deepseek-v3.1", - "name": "DeepSeek-V3.1-Terminus", - "display_name": "DeepSeek-V3.1-Terminus", + "id": "claude-sonnet-4-5-20250929", + "name": "Anthropic: Claude Sonnet 4.5 (20250929)", + "display_name": "Anthropic: Claude Sonnet 4.5 (20250929)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 200000, "output": 64000 }, "temperature": true, @@ -44775,20 +42833,21 @@ "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "open_weights": false, + "knowledge": "2025-09", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 3, + "output": 15, + "cache_read": 0.30000000000000004, + "cache_write": 3.75 + } }, { - "id": "minimax-m2", - "name": "MiniMax-M2", - "display_name": "MiniMax-M2", + "id": "grok-3", + "name": "xAI Grok 3", + "display_name": "xAI Grok 3", "modalities": { "input": [ "text" @@ -44798,34 +42857,33 @@ ] }, "limit": { - "context": 204800, - "output": 131100 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "open_weights": false, + "knowledge": "2024-06", + "release_date": "2024-06-01", + "last_updated": "2024-06-01", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 - }, - "type": "chat" + "input": 3, + "output": 15, + "cache_read": 0.75 + } }, { - "id": "qwen3-235b", - "name": "Qwen3-235B-A22B", - "display_name": "Qwen3-235B-A22B", + "id": "mistral-small", + "name": "Mistral Small", + "display_name": "Mistral Small", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -44833,29 +42891,27 @@ }, "limit": { "context": 128000, - "output": 32000 + "output": 128000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "open_weights": false, + "knowledge": "2024-02", + "release_date": "2024-02-26", + "last_updated": "2024-02-26", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 75, + "output": 200 + } }, { - "id": "deepseek-v3.2-chat", - "name": "DeepSeek-V3.2", - "display_name": "DeepSeek-V3.2", + "id": "kimi-k2-0711", + "name": "Kimi K2 (07/11)", + "display_name": "Kimi K2 (07/11)", "modalities": { "input": [ "text" @@ -44865,41 +42921,40 @@ ] }, "limit": { - "context": 128000, - "output": 64000 + "context": 131072, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-11", - "release_date": "2025-12-01", - "last_updated": "2025-12-01", + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.5700000000000001, + "output": 2.3 + } }, { - "id": "kimi-k2-0905", - "name": "Kimi-K2-0905", - "display_name": "Kimi-K2-0905", + "id": "chatgpt-4o-latest", + "name": "OpenAI ChatGPT-4o", + "display_name": "OpenAI ChatGPT-4o", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 64000 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -44908,19 +42963,19 @@ }, "attachment": false, "open_weights": false, - "knowledge": "2024-12", - "release_date": "2025-09-05", - "last_updated": "2025-09-05", + "knowledge": "2024-08", + "release_date": "2024-08-14", + "last_updated": "2024-08-14", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 5, + "output": 20, + "cache_read": 2.5 + } }, { - "id": "kimi-k2-thinking", - "name": "Kimi-K2-Thinking", - "display_name": "Kimi-K2-Thinking", + "id": "qwen3-coder-30b-a3b-instruct", + "name": "Qwen3 Coder 30B A3B Instruct", + "display_name": "Qwen3 Coder 30B A3B Instruct", "modalities": { "input": [ "text" @@ -44930,30 +42985,28 @@ ] }, "limit": { - "context": 128000, - "output": 64000 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-11", - "release_date": "2025-11-06", - "last_updated": "2025-11-06", + "open_weights": false, + "knowledge": "2025-07", + "release_date": "2025-07-31", + "last_updated": "2025-07-31", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" - }, + "input": 0.09999999999999999, + "output": 0.3 + } + }, { - "id": "qwen3-235b-a22b-thinking-2507", - "name": "Qwen3-235B-A22B-Thinking", - "display_name": "Qwen3-235B-A22B-Thinking", + "id": "kimi-k2-0905", + "name": "Kimi K2 (09/05)", + "display_name": "Kimi K2 (09/05)", "modalities": { "input": [ "text" @@ -44963,63 +43016,61 @@ ] }, "limit": { - "context": 256000, - "output": 64000 + "context": 262144, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-01", - "last_updated": "2025-07-01", + "open_weights": false, + "knowledge": "2025-09", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.5, + "output": 2, + "cache_read": 0.39999999999999997 + } }, { - "id": "qwen3-vl-plus", - "name": "Qwen3-VL-Plus", - "display_name": "Qwen3-VL-Plus", + "id": "sonar-reasoning", + "name": "Perplexity Sonar Reasoning", + "display_name": "Perplexity Sonar Reasoning", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 32000 + "context": 127000, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-12", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "knowledge": "2025-01", + "release_date": "2025-01-27", + "last_updated": "2025-01-27", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 1, + "output": 5 + } }, { - "id": "glm-4.6", - "name": "GLM-4.6", - "display_name": "GLM-4.6", + "id": "llama-3.3-70b-instruct", + "name": "Meta Llama 3.3 70B Instruct", + "display_name": "Meta Llama 3.3 70B Instruct", "modalities": { "input": [ "text" @@ -45029,62 +43080,62 @@ ] }, "limit": { - "context": 200000, - "output": 128000 + "context": 128000, + "output": 16400 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-12-01", - "last_updated": "2025-11-13", + "knowledge": "2024-12", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.13, + "output": 0.39 + } }, { - "id": "tstars2.0", - "name": "TStars-2.0", - "display_name": "TStars-2.0", + "id": "gpt-5.1-codex-mini", + "name": "OpenAI: GPT-5.1 Codex Mini", + "display_name": "OpenAI: GPT-5.1 Codex Mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "text" + "text", + "image" ] }, "limit": { - "context": 128000, - "output": 64000 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2024-01", - "release_date": "2024-01-01", + "knowledge": "2025-01", + "release_date": "2025-01-01", "last_updated": "2025-01-01", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.25, + "output": 2, + "cache_read": 0.024999999999999998 + } }, { - "id": "qwen3-235b-a22b-instruct", - "name": "Qwen3-235B-A22B-Instruct", - "display_name": "Qwen3-235B-A22B-Instruct", + "id": "kimi-k2-thinking", + "name": "Kimi K2 Thinking", + "display_name": "Kimi K2 Thinking", "modalities": { "input": [ "text" @@ -45095,7 +43146,7 @@ }, "limit": { "context": 256000, - "output": 64000 + "output": 262144 }, "temperature": true, "tool_call": true, @@ -45103,20 +43154,19 @@ "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-01", - "last_updated": "2025-07-01", + "open_weights": false, + "knowledge": "2025-11", + "release_date": "2025-11-06", + "last_updated": "2025-11-06", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.48, + "output": 2 + } }, { - "id": "qwen3-max", - "name": "Qwen3-Max", - "display_name": "Qwen3-Max", + "id": "o3-mini", + "name": "OpenAI o3 Mini", + "display_name": "OpenAI o3 Mini", "modalities": { "input": [ "text" @@ -45126,166 +43176,164 @@ ] }, "limit": { - "context": 256000, - "output": 32000 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2024-12", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "knowledge": "2023-10", + "release_date": "2023-10-01", + "last_updated": "2023-10-01", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 1.1, + "output": 4.4, + "cache_read": 0.55 + } }, { - "id": "deepseek-v3.2", - "name": "DeepSeek-V3.2-Exp", - "display_name": "DeepSeek-V3.2-Exp", + "id": "claude-4.5-sonnet", + "name": "Anthropic: Claude Sonnet 4.5", + "display_name": "Anthropic: Claude Sonnet 4.5", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 200000, "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "open_weights": false, + "knowledge": "2025-09", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 3, + "output": 15, + "cache_read": 0.30000000000000004, + "cache_write": 3.75 + } }, { - "id": "qwen3-max-preview", - "name": "Qwen3-Max-Preview", - "display_name": "Qwen3-Max-Preview", + "id": "gpt-5.1", + "name": "OpenAI GPT-5.1", + "display_name": "OpenAI GPT-5.1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "text" + "text", + "image" ] }, "limit": { - "context": 256000, - "output": 32000 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2024-12", + "knowledge": "2025-01", "release_date": "2025-01-01", "last_updated": "2025-01-01", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 1.25, + "output": 10, + "cache_read": 0.12500000000000003 + } }, { - "id": "qwen3-coder-plus", - "name": "Qwen3-Coder-Plus", - "display_name": "Qwen3-Coder-Plus", + "id": "codex-mini-latest", + "name": "OpenAI Codex Mini Latest", + "display_name": "OpenAI Codex Mini Latest", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 64000 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-01", - "last_updated": "2025-07-01", + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 1.5, + "output": 6, + "cache_read": 0.375 + } }, { - "id": "qwen3-32b", - "name": "Qwen3-32B", - "display_name": "Qwen3-32B", + "id": "gpt-5-nano", + "name": "OpenAI GPT-5 Nano", + "display_name": "OpenAI GPT-5 Nano", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32000 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" - } - ] - }, - "synthetic": { - "id": "synthetic", - "name": "Synthetic", - "display_name": "Synthetic", - "api": "https://api.synthetic.new/v1", - "doc": "https://synthetic.new/pricing", - "models": [ + "input": 0.049999999999999996, + "output": 0.39999999999999997, + "cache_read": 0.005 + } + }, { - "id": "hf:Qwen/Qwen3-235B-A22B-Instruct-2507", - "name": "Qwen 3 235B Instruct", - "display_name": "Qwen 3 235B Instruct", + "id": "gpt-5-codex", + "name": "OpenAI: GPT-5 Codex", + "display_name": "OpenAI: GPT-5 Codex", "modalities": { "input": [ "text" @@ -45295,61 +43343,62 @@ ] }, "limit": { - "context": 256000, - "output": 32000 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04-28", - "last_updated": "2025-07-21", + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.2, - "output": 0.6 - }, - "type": "chat" + "input": 1.25, + "output": 10, + "cache_read": 0.12500000000000003 + } }, { - "id": "hf:Qwen/Qwen2.5-Coder-32B-Instruct", - "name": "Qwen2.5-Coder-32B-Instruct", - "display_name": "Qwen2.5-Coder-32B-Instruct", + "id": "gpt-4o", + "name": "OpenAI GPT-4o", + "display_name": "OpenAI GPT-4o", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 128000, + "output": 16384 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2024-11-11", - "last_updated": "2024-11-11", + "open_weights": false, + "knowledge": "2024-05", + "release_date": "2024-05-13", + "last_updated": "2024-05-13", "cost": { - "input": 0.8, - "output": 0.8 - }, - "type": "chat" + "input": 2.5, + "output": 10, + "cache_read": 1.25 + } }, { - "id": "hf:Qwen/Qwen3-Coder-480B-A35B-Instruct", - "name": "Qwen 3 Coder 480B", - "display_name": "Qwen 3 Coder 480B", + "id": "deepseek-tng-r1t2-chimera", + "name": "DeepSeek TNG R1T2 Chimera", + "display_name": "DeepSeek TNG R1T2 Chimera", "modalities": { "input": [ "text" @@ -45359,8 +43408,8 @@ ] }, "limit": { - "context": 256000, - "output": 32000 + "context": 130000, + "output": 163840 }, "temperature": true, "tool_call": true, @@ -45368,31 +43417,31 @@ "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-23", - "last_updated": "2025-07-23", + "open_weights": false, + "knowledge": "2025-07", + "release_date": "2025-07-02", + "last_updated": "2025-07-02", "cost": { - "input": 2, - "output": 2 - }, - "type": "chat" + "input": 0.3, + "output": 1.2 + } }, { - "id": "hf:Qwen/Qwen3-235B-A22B-Thinking-2507", - "name": "Qwen3 235B A22B Thinking 2507", - "display_name": "Qwen3 235B A22B Thinking 2507", + "id": "claude-4.5-opus", + "name": "Anthropic: Claude Opus 4.5", + "display_name": "Anthropic: Claude Opus 4.5", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 32000 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -45401,52 +43450,54 @@ "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-25", - "last_updated": "2025-07-25", + "open_weights": false, + "knowledge": "2025-11", + "release_date": "2025-11-24", + "last_updated": "2025-11-24", "cost": { - "input": 0.65, - "output": 3 - }, - "type": "chat" + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 + } }, { - "id": "hf:MiniMaxAI/MiniMax-M2", - "name": "MiniMax-M2", - "display_name": "MiniMax-M2", + "id": "gpt-4.1", + "name": "OpenAI GPT-4.1", + "display_name": "OpenAI GPT-4.1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 196608, - "output": 131000 + "context": 1047576, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-10-27", - "last_updated": "2025-10-27", + "open_weights": false, + "knowledge": "2025-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.55, - "output": 2.19 - }, - "type": "chat" + "input": 2, + "output": 8, + "cache_read": 0.5 + } }, { - "id": "hf:MiniMaxAI/MiniMax-M2.1", - "name": "MiniMax-M2.1", - "display_name": "MiniMax-M2.1", + "id": "sonar", + "name": "Perplexity Sonar", + "display_name": "Perplexity Sonar", "modalities": { "input": [ "text" @@ -45456,29 +43507,28 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 127000, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-12-23", - "last_updated": "2025-12-23", + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-01-27", + "last_updated": "2025-01-27", "cost": { - "input": 0.55, - "output": 2.19 - }, - "type": "chat" + "input": 1, + "output": 1 + } }, { - "id": "hf:meta-llama/Llama-3.1-70B-Instruct", - "name": "Llama-3.1-70B-Instruct", - "display_name": "Llama-3.1-70B-Instruct", + "id": "glm-4.6", + "name": "Zai GLM-4.6", + "display_name": "Zai GLM-4.6", "modalities": { "input": [ "text" @@ -45488,8 +43538,8 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -45498,152 +43548,149 @@ "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "open_weights": false, + "knowledge": "2024-07", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", "cost": { - "input": 0.9, - "output": 0.9 - }, - "type": "chat" + "input": 0.44999999999999996, + "output": 1.5 + } }, { - "id": "hf:meta-llama/Llama-3.1-8B-Instruct", - "name": "Llama-3.1-8B-Instruct", - "display_name": "Llama-3.1-8B-Instruct", + "id": "o4-mini", + "name": "OpenAI o4 Mini", + "display_name": "OpenAI o4 Mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "open_weights": false, + "knowledge": "2024-06", + "release_date": "2024-06-01", + "last_updated": "2024-06-01", "cost": { - "input": 0.2, - "output": 0.2 - }, - "type": "chat" + "input": 1.1, + "output": 4.4, + "cache_read": 0.275 + } }, { - "id": "hf:meta-llama/Llama-3.3-70B-Instruct", - "name": "Llama-3.3-70B-Instruct", - "display_name": "Llama-3.3-70B-Instruct", + "id": "qwen3-235b-a22b-thinking", + "name": "Qwen3 235B A22B Thinking", + "display_name": "Qwen3 235B A22B Thinking", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 262144, + "output": 81920 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "open_weights": false, + "knowledge": "2025-07", + "release_date": "2025-07-25", + "last_updated": "2025-07-25", "cost": { - "input": 0.9, - "output": 0.9 - }, - "type": "chat" + "input": 0.3, + "output": 2.9000000000000004 + } }, { - "id": "hf:meta-llama/Llama-4-Scout-17B-16E-Instruct", - "name": "Llama-4-Scout-17B-16E-Instruct", - "display_name": "Llama-4-Scout-17B-16E-Instruct", + "id": "hermes-2-pro-llama-3-8b", + "name": "Hermes 2 Pro Llama 3 8B", + "display_name": "Hermes 2 Pro Llama 3 8B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 328000, - "output": 4096 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "attachment": false, + "open_weights": false, + "knowledge": "2024-05", + "release_date": "2024-05-27", + "last_updated": "2024-05-27", "cost": { - "input": 0.15, - "output": 0.6 - }, - "type": "chat" + "input": 0.14, + "output": 0.14 + } }, { - "id": "hf:meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8", - "name": "Llama-4-Maverick-17B-128E-Instruct-FP8", - "display_name": "Llama-4-Maverick-17B-128E-Instruct-FP8", + "id": "o1", + "name": "OpenAI: o1", + "display_name": "OpenAI: o1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 524000, - "output": 4096 + "context": 200000, + "output": 100000 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "attachment": false, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.22, - "output": 0.88 - }, - "type": "chat" + "input": 15, + "output": 60, + "cache_read": 7.5 + } }, { - "id": "hf:meta-llama/Llama-3.1-405B-Instruct", - "name": "Llama-3.1-405B-Instruct", - "display_name": "Llama-3.1-405B-Instruct", + "id": "grok-3-mini", + "name": "xAI Grok 3 Mini", + "display_name": "xAI Grok 3 Mini", "modalities": { "input": [ "text" @@ -45653,30 +43700,29 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "open_weights": false, + "knowledge": "2024-06", + "release_date": "2024-06-01", + "last_updated": "2024-06-01", "cost": { - "input": 3, - "output": 3 - }, - "type": "chat" + "input": 0.3, + "output": 0.5, + "cache_read": 0.075 + } }, { - "id": "hf:moonshotai/Kimi-K2-Instruct-0905", - "name": "Kimi K2 0905", - "display_name": "Kimi K2 0905", + "id": "sonar-pro", + "name": "Perplexity Sonar Pro", + "display_name": "Perplexity Sonar Pro", "modalities": { "input": [ "text" @@ -45686,62 +43732,61 @@ ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 200000, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-09-05", - "last_updated": "2025-09-05", + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-01-27", + "last_updated": "2025-01-27", "cost": { - "input": 1.2, - "output": 1.2 - }, - "type": "chat" + "input": 3, + "output": 15 + } }, { - "id": "hf:moonshotai/Kimi-K2-Thinking", - "name": "Kimi K2 Thinking", - "display_name": "Kimi K2 Thinking", + "id": "gpt-5-mini", + "name": "OpenAI GPT-5 Mini", + "display_name": "OpenAI GPT-5 Mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-11", - "release_date": "2025-11-07", - "last_updated": "2025-11-07", + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.55, - "output": 2.19 - }, - "type": "chat" + "input": 0.25, + "output": 2, + "cache_read": 0.024999999999999998 + } }, { - "id": "hf:zai-org/GLM-4.5", - "name": "GLM 4.5", - "display_name": "GLM 4.5", + "id": "deepseek-r1-distill-llama-70b", + "name": "DeepSeek R1 Distill Llama 70B", + "display_name": "DeepSeek R1 Distill Llama 70B", "modalities": { "input": [ "text" @@ -45752,7 +43797,7 @@ }, "limit": { "context": 128000, - "output": 96000 + "output": 4096 }, "temperature": true, "tool_call": true, @@ -45761,20 +43806,19 @@ "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-01-20", + "last_updated": "2025-01-20", "cost": { - "input": 0.55, - "output": 2.19 - }, - "type": "chat" + "input": 0.03, + "output": 0.13 + } }, { - "id": "hf:zai-org/GLM-4.7", - "name": "GLM 4.7", - "display_name": "GLM 4.7", + "id": "o1-mini", + "name": "OpenAI: o1-mini", + "display_name": "OpenAI: o1-mini", "modalities": { "input": [ "text" @@ -45784,33 +43828,33 @@ ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 128000, + "output": 65536 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-22", - "last_updated": "2025-12-22", + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.55, - "output": 2.19 - }, - "type": "chat" + "input": 1.1, + "output": 4.4, + "cache_read": 0.55 + } }, { - "id": "hf:zai-org/GLM-4.6", - "name": "GLM 4.6", - "display_name": "GLM 4.6", + "id": "claude-3.7-sonnet", + "name": "Anthropic: Claude 3.7 Sonnet", + "display_name": "Anthropic: Claude 3.7 Sonnet", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -45823,89 +43867,90 @@ "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-09-30", - "last_updated": "2025-09-30", + "open_weights": false, + "knowledge": "2025-02", + "release_date": "2025-02-19", + "last_updated": "2025-02-19", "cost": { - "input": 0.55, - "output": 2.19 - }, - "type": "chat" + "input": 3, + "output": 15, + "cache_read": 0.30000000000000004, + "cache_write": 3.75 + } }, { - "id": "hf:deepseek-ai/DeepSeek-R1", - "name": "DeepSeek R1", - "display_name": "DeepSeek R1", + "id": "claude-3-haiku-20240307", + "name": "Anthropic: Claude 3 Haiku", + "display_name": "Anthropic: Claude 3 Haiku", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 200000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2025-01-20", - "last_updated": "2025-01-20", + "open_weights": false, + "knowledge": "2024-03", + "release_date": "2024-03-07", + "last_updated": "2024-03-07", "cost": { - "input": 0.55, - "output": 2.19 - }, - "type": "chat" + "input": 0.25, + "output": 1.25, + "cache_read": 0.03, + "cache_write": 0.3 + } }, { - "id": "hf:deepseek-ai/DeepSeek-R1-0528", - "name": "DeepSeek R1 (0528)", - "display_name": "DeepSeek R1 (0528)", + "id": "o3-pro", + "name": "OpenAI o3 Pro", + "display_name": "OpenAI o3 Pro", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-08-01", - "last_updated": "2025-08-01", + "knowledge": "2024-06", + "release_date": "2024-06-01", + "last_updated": "2024-06-01", "cost": { - "input": 3, - "output": 8 - }, - "type": "chat" + "input": 20, + "output": 80 + } }, { - "id": "hf:deepseek-ai/DeepSeek-V3.1-Terminus", - "name": "DeepSeek V3.1 Terminus", - "display_name": "DeepSeek V3.1 Terminus", + "id": "qwen2.5-coder-7b-fast", + "name": "Qwen2.5 Coder 7B fast", + "display_name": "Qwen2.5 Coder 7B fast", "modalities": { "input": [ "text" @@ -45915,29 +43960,28 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 32000, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-09-22", - "last_updated": "2025-09-25", + "knowledge": "2024-09", + "release_date": "2024-09-15", + "last_updated": "2024-09-15", "cost": { - "input": 1.2, - "output": 1.2 - }, - "type": "chat" + "input": 0.03, + "output": 0.09 + } }, { - "id": "hf:deepseek-ai/DeepSeek-V3.2", - "name": "DeepSeek V3.2", - "display_name": "DeepSeek V3.2", + "id": "deepseek-reasoner", + "name": "DeepSeek Reasoner", + "display_name": "DeepSeek Reasoner", "modalities": { "input": [ "text" @@ -45947,42 +43991,41 @@ ] }, "limit": { - "context": 162816, - "output": 8000 + "context": 128000, + "output": 64000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-12-01", - "last_updated": "2025-12-01", + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-01-20", + "last_updated": "2025-01-20", "cost": { - "input": 0.27, - "output": 0.4, - "cache_read": 0.27, - "cache_write": 0 - }, - "type": "chat" + "input": 0.56, + "output": 1.68, + "cache_read": 0.07 + } }, { - "id": "hf:deepseek-ai/DeepSeek-V3", - "name": "DeepSeek V3", - "display_name": "DeepSeek V3", + "id": "gemini-2.5-pro", + "name": "Google Gemini 2.5 Pro", + "display_name": "Google Gemini 2.5 Pro", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -45991,55 +44034,57 @@ "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-01-20", - "last_updated": "2025-05-29", + "open_weights": false, + "knowledge": "2025-06", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", "cost": { "input": 1.25, - "output": 1.25 - }, - "type": "chat" + "output": 10, + "cache_read": 0.3125, + "cache_write": 1.25 + } }, { - "id": "hf:deepseek-ai/DeepSeek-V3.1", - "name": "DeepSeek V3.1", - "display_name": "DeepSeek V3.1", + "id": "gemma-3-12b-it", + "name": "Google Gemma 3 12B", + "display_name": "Google Gemma 3 12B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 131072, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-08-21", - "last_updated": "2025-08-21", + "knowledge": "2024-12", + "release_date": "2024-12-01", + "last_updated": "2024-12-01", "cost": { - "input": 0.56, - "output": 1.68 - }, - "type": "chat" + "input": 0.049999999999999996, + "output": 0.09999999999999999 + } }, { - "id": "hf:deepseek-ai/DeepSeek-V3-0324", - "name": "DeepSeek V3 (0324)", - "display_name": "DeepSeek V3 (0324)", + "id": "mistral-nemo", + "name": "Mistral Nemo", + "display_name": "Mistral Nemo", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -46047,67 +44092,60 @@ }, "limit": { "context": 128000, - "output": 128000 + "output": 16400 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-08-01", - "last_updated": "2025-08-01", + "knowledge": "2024-07", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", "cost": { - "input": 1.2, - "output": 1.2 - }, - "type": "chat" + "input": 20, + "output": 40 + } }, { - "id": "hf:openai/gpt-oss-120b", - "name": "GPT OSS 120B", - "display_name": "GPT OSS 120B", + "id": "o3", + "name": "OpenAI o3", + "display_name": "OpenAI o3", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "open_weights": false, + "knowledge": "2024-06", + "release_date": "2024-06-01", + "last_updated": "2024-06-01", "cost": { - "input": 0.1, - "output": 0.1 - }, - "type": "chat" - } - ] - }, - "deepinfra": { - "id": "deepinfra", - "name": "Deep Infra", - "display_name": "Deep Infra", - "doc": "https://deepinfra.com/models", - "models": [ + "input": 2, + "output": 8, + "cache_read": 0.5 + } + }, { - "id": "moonshotai/Kimi-K2-Instruct", - "name": "Kimi K2", - "display_name": "Kimi K2", + "id": "gpt-oss-20b", + "name": "OpenAI GPT-OSS 20b", + "display_name": "OpenAI GPT-OSS 20b", "modalities": { "input": [ "text" @@ -46118,28 +44156,28 @@ }, "limit": { "context": 131072, - "output": 32768 + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-07-11", - "last_updated": "2025-07-11", + "open_weights": false, + "knowledge": "2024-06", + "release_date": "2024-06-01", + "last_updated": "2024-06-01", "cost": { - "input": 0.5, - "output": 2 - }, - "type": "chat" + "input": 0.049999999999999996, + "output": 0.19999999999999998 + } }, { - "id": "moonshotai/Kimi-K2-Thinking", - "name": "Kimi K2 Thinking", - "display_name": "Kimi K2 Thinking", + "id": "gpt-oss-120b", + "name": "OpenAI GPT-OSS 120b", + "display_name": "OpenAI GPT-OSS 120b", "modalities": { "input": [ "text" @@ -46150,7 +44188,7 @@ }, "limit": { "context": 131072, - "output": 32768 + "output": 131072 }, "temperature": true, "tool_call": true, @@ -46159,117 +44197,119 @@ "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-11-06", - "last_updated": "2025-11-07", + "open_weights": false, + "knowledge": "2024-06", + "release_date": "2024-06-01", + "last_updated": "2024-06-01", "cost": { - "input": 0.47, - "output": 2 - }, - "type": "chat" + "input": 0.04, + "output": 0.16 + } }, { - "id": "MiniMaxAI/MiniMax-M2", - "name": "MiniMax M2", - "display_name": "MiniMax M2", + "id": "claude-3.5-haiku", + "name": "Anthropic: Claude 3.5 Haiku", + "display_name": "Anthropic: Claude 3.5 Haiku", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 200000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, + "open_weights": false, "knowledge": "2024-10", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", "cost": { - "input": 0.254, - "output": 1.02 - }, - "type": "chat" + "input": 0.7999999999999999, + "output": 4, + "cache_read": 0.08, + "cache_write": 1 + } }, { - "id": "openai/gpt-oss-20b", - "name": "GPT OSS 20B", - "display_name": "GPT OSS 20B", + "id": "gpt-5-chat-latest", + "name": "OpenAI GPT-5 Chat Latest", + "display_name": "OpenAI GPT-5 Chat Latest", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, + "context": 128000, "output": 16384 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "open_weights": false, + "knowledge": "2024-09", + "release_date": "2024-09-30", + "last_updated": "2024-09-30", "cost": { - "input": 0.03, - "output": 0.14 - }, - "type": "chat" + "input": 1.25, + "output": 10, + "cache_read": 0.12500000000000003 + } }, { - "id": "openai/gpt-oss-120b", - "name": "GPT OSS 120B", - "display_name": "GPT OSS 120B", + "id": "gpt-4o-mini", + "name": "OpenAI GPT-4o-mini", + "display_name": "OpenAI GPT-4o-mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, + "context": 128000, "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "open_weights": false, + "knowledge": "2024-07", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", "cost": { - "input": 0.05, - "output": 0.24 - }, - "type": "chat" + "input": 0.15, + "output": 0.6, + "cache_read": 0.075 + } }, { - "id": "Qwen/Qwen3-Coder-480B-A35B-Instruct", - "name": "Qwen3 Coder 480B A35B Instruct", - "display_name": "Qwen3 Coder 480B A35B Instruct", + "id": "gemma2-9b-it", + "name": "Google Gemma 2", + "display_name": "Google Gemma 2", "modalities": { "input": [ "text" @@ -46279,61 +44319,63 @@ ] }, "limit": { - "context": 262144, - "output": 66536 + "context": 8192, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-23", - "last_updated": "2025-07-23", + "open_weights": false, + "knowledge": "2024-06", + "release_date": "2024-06-25", + "last_updated": "2024-06-25", "cost": { - "input": 0.4, - "output": 1.6 - }, - "type": "chat" + "input": 0.01, + "output": 0.03 + } }, { - "id": "Qwen/Qwen3-Coder-480B-A35B-Instruct-Turbo", - "name": "Qwen3 Coder 480B A35B Instruct Turbo", - "display_name": "Qwen3 Coder 480B A35B Instruct Turbo", + "id": "claude-sonnet-4", + "name": "Anthropic: Claude Sonnet 4", + "display_name": "Anthropic: Claude Sonnet 4", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 66536 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-23", - "last_updated": "2025-07-23", + "open_weights": false, + "knowledge": "2025-05", + "release_date": "2025-05-14", + "last_updated": "2025-05-14", "cost": { - "input": 0.3, - "output": 1.2 - }, - "type": "chat" + "input": 3, + "output": 15, + "cache_read": 0.30000000000000004, + "cache_write": 3.75 + } }, { - "id": "zai-org/GLM-4.5", - "name": "GLM-4.5", - "display_name": "GLM-4.5", + "id": "sonar-reasoning-pro", + "name": "Perplexity Sonar Reasoning Pro", + "display_name": "Perplexity Sonar Reasoning Pro", "modalities": { "input": [ "text" @@ -46343,72 +44385,62 @@ ] }, "limit": { - "context": 131072, - "output": 98304 + "context": 127000, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-01-27", + "last_updated": "2025-01-27", "cost": { - "input": 0.6, - "output": 2.2 - }, - "type": "chat" + "input": 2, + "output": 8 + } }, { - "id": "zai-org/GLM-4.7", - "name": "GLM-4.7", - "display_name": "GLM-4.7", + "id": "gpt-5", + "name": "OpenAI GPT-5", + "display_name": "OpenAI GPT-5", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 202752, - "output": 16384 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-22", - "last_updated": "2025-12-22", + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.43, - "output": 1.75, - "cache_read": 0.08 - }, - "type": "chat" - } - ] - }, - "zhipuai": { - "id": "zhipuai", - "name": "Zhipu AI", - "display_name": "Zhipu AI", - "api": "https://open.bigmodel.cn/api/paas/v4", - "doc": "https://docs.z.ai/guides/overview/pricing", - "models": [ + "input": 1.25, + "output": 10, + "cache_read": 0.12500000000000003 + } + }, { - "id": "glm-4.6v-flash", - "name": "GLM-4.6V-Flash", - "display_name": "GLM-4.6V-Flash", + "id": "qwen3-vl-235b-a22b-instruct", + "name": "Qwen3 VL 235B A22B Instruct", + "display_name": "Qwen3 VL 235B A22B Instruct", "modalities": { "input": [ "text", @@ -46420,65 +44452,60 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 256000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-08", - "last_updated": "2025-12-08", + "attachment": false, + "open_weights": false, + "knowledge": "2025-09", + "release_date": "2025-09-23", + "last_updated": "2025-09-23", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.3, + "output": 1.5 + } }, { - "id": "glm-4.6v", - "name": "GLM-4.6V", - "display_name": "GLM-4.6V", + "id": "qwen3-30b-a3b", + "name": "Qwen3 30B A3B", + "display_name": "Qwen3 30B A3B", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 41000, + "output": 41000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-08", - "last_updated": "2025-12-08", + "attachment": false, + "open_weights": false, + "knowledge": "2025-06", + "release_date": "2025-06-01", + "last_updated": "2025-06-01", "cost": { - "input": 0.3, - "output": 0.9 - }, - "type": "chat" + "input": 0.08, + "output": 0.29 + } }, { - "id": "glm-4.6", - "name": "GLM-4.6", - "display_name": "GLM-4.6", + "id": "deepseek-v3.2", + "name": "DeepSeek V3.2", + "display_name": "DeepSeek V3.2", "modalities": { "input": [ "text" @@ -46488,67 +44515,62 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 163840, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-09-30", - "last_updated": "2025-09-30", + "open_weights": false, + "knowledge": "2025-09", + "release_date": "2025-09-22", + "last_updated": "2025-09-22", "cost": { - "input": 0.6, - "output": 2.2, - "cache_read": 0.11, - "cache_write": 0 - }, - "type": "chat" + "input": 0.27, + "output": 0.41 + } }, { - "id": "glm-4.5v", - "name": "GLM-4.5V", - "display_name": "GLM-4.5V", + "id": "grok-4-1-fast-non-reasoning", + "name": "xAI Grok 4.1 Fast Non-Reasoning", + "display_name": "xAI Grok 4.1 Fast Non-Reasoning", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ - "text" + "text", + "image" ] }, "limit": { - "context": 64000, - "output": 16384 + "context": 2000000, + "output": 30000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-08-11", - "last_updated": "2025-08-11", + "attachment": false, + "open_weights": false, + "knowledge": "2025-11", + "release_date": "2025-11-17", + "last_updated": "2025-11-17", "cost": { - "input": 0.6, - "output": 1.8 - }, - "type": "chat" + "input": 0.19999999999999998, + "output": 0.5, + "cache_read": 0.049999999999999996 + } }, { - "id": "glm-4.5-air", - "name": "GLM-4.5-Air", - "display_name": "GLM-4.5-Air", + "id": "gpt-5-pro", + "name": "OpenAI: GPT-5 Pro", + "display_name": "OpenAI: GPT-5 Pro", "modalities": { "input": [ "text" @@ -46558,32 +44580,28 @@ ] }, "limit": { - "context": 131072, - "output": 98304 + "context": 128000, + "output": 32768 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.2, - "output": 1.1, - "cache_read": 0.03, - "cache_write": 0 - }, - "type": "chat" + "input": 15, + "output": 120 + } }, { - "id": "glm-4.5", - "name": "GLM-4.5", - "display_name": "GLM-4.5", + "id": "llama-3.3-70b-versatile", + "name": "Meta Llama 3.3 70B Versatile", + "display_name": "Meta Llama 3.3 70B Versatile", "modalities": { "input": [ "text" @@ -46594,31 +44612,27 @@ }, "limit": { "context": 131072, - "output": 98304 + "output": 32678 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "open_weights": false, + "knowledge": "2024-12", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 0.6, - "output": 2.2, - "cache_read": 0.11, - "cache_write": 0 - }, - "type": "chat" + "input": 0.59, + "output": 0.7899999999999999 + } }, { - "id": "glm-4.5-flash", - "name": "GLM-4.5-Flash", - "display_name": "GLM-4.5-Flash", + "id": "mistral-large-2411", + "name": "Mistral-Large", + "display_name": "Mistral-Large", "modalities": { "input": [ "text" @@ -46628,43 +44642,40 @@ ] }, "limit": { - "context": 131072, - "output": 98304 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "open_weights": false, + "knowledge": "2024-07", + "release_date": "2024-07-24", + "last_updated": "2024-07-24", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 - }, - "type": "chat" + "input": 2, + "output": 6 + } }, { - "id": "glm-4.7", - "name": "GLM-4.7", - "display_name": "GLM-4.7", + "id": "claude-opus-4-1-20250805", + "name": "Anthropic: Claude Opus 4.1 (20250805)", + "display_name": "Anthropic: Claude Opus 4.1 (20250805)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 200000, + "output": 32000 }, "temperature": true, "tool_call": true, @@ -46673,31 +44684,21 @@ "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-22", - "last_updated": "2025-12-22", + "open_weights": false, + "knowledge": "2025-08", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.6, - "output": 2.2, - "cache_read": 0.11, - "cache_write": 0 - }, - "type": "chat" - } - ] - }, - "submodel": { - "id": "submodel", - "name": "submodel", - "display_name": "submodel", - "api": "https://llm.submodel.ai/v1", - "doc": "https://submodel.gitbook.io", - "models": [ + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 + } + }, { - "id": "openai/gpt-oss-120b", - "name": "GPT OSS 120B", - "display_name": "GPT OSS 120B", + "id": "ernie-4.5-21b-a3b-thinking", + "name": "Baidu Ernie 4.5 21B A3B Thinking", + "display_name": "Baidu Ernie 4.5 21B A3B Thinking", "modalities": { "input": [ "text" @@ -46707,60 +44708,63 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 128000, + "output": 8000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, "attachment": false, - "open_weights": true, - "release_date": "2025-08-23", - "last_updated": "2025-08-23", + "open_weights": false, + "knowledge": "2025-03", + "release_date": "2025-03-16", + "last_updated": "2025-03-16", "cost": { - "input": 0.1, - "output": 0.5 - }, - "type": "chat" + "input": 0.07, + "output": 0.28 + } }, { - "id": "Qwen/Qwen3-235B-A22B-Instruct-2507", - "name": "Qwen3 235B A22B Instruct 2507", - "display_name": "Qwen3 235B A22B Instruct 2507", + "id": "gpt-5.1-chat-latest", + "name": "OpenAI GPT-5.1 Chat", + "display_name": "OpenAI GPT-5.1 Chat", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "text" + "text", + "image" ] }, "limit": { - "context": 262144, - "output": 131072 + "context": 128000, + "output": 16384 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-08-23", - "last_updated": "2025-08-23", + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.2, - "output": 0.3 - }, - "type": "chat" + "input": 1.25, + "output": 10, + "cache_read": 0.12500000000000003 + } }, { - "id": "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8", - "name": "Qwen3 Coder 480B A35B Instruct", - "display_name": "Qwen3 Coder 480B A35B Instruct", + "id": "qwen3-32b", + "name": "Qwen3 32B", + "display_name": "Qwen3 32B", "modalities": { "input": [ "text" @@ -46770,63 +44774,67 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 131072, + "output": 40960 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "release_date": "2025-08-23", - "last_updated": "2025-08-23", + "knowledge": "2025-04", + "release_date": "2025-04-28", + "last_updated": "2025-04-28", "cost": { - "input": 0.2, - "output": 0.8 - }, - "type": "chat" + "input": 0.29, + "output": 0.59 + } }, { - "id": "Qwen/Qwen3-235B-A22B-Thinking-2507", - "name": "Qwen3 235B A22B Thinking 2507", - "display_name": "Qwen3 235B A22B Thinking 2507", + "id": "claude-haiku-4-5-20251001", + "name": "Anthropic: Claude 4.5 Haiku (20251001)", + "display_name": "Anthropic: Claude 4.5 Haiku (20251001)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 131072 + "context": 200000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-08-23", - "last_updated": "2025-08-23", + "open_weights": false, + "knowledge": "2025-10", + "release_date": "2025-10-01", + "last_updated": "2025-10-01", "cost": { - "input": 0.2, - "output": 0.6 - }, - "type": "chat" + "input": 1, + "output": 5, + "cache_read": 0.09999999999999999, + "cache_write": 1.25 + } }, { - "id": "zai-org/GLM-4.5-FP8", - "name": "GLM 4.5 FP8", - "display_name": "GLM 4.5 FP8", + "id": "llama-4-scout", + "name": "Meta Llama 4 Scout 17B 16E", + "display_name": "Meta Llama 4 Scout 17B 16E", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -46834,28 +44842,36 @@ }, "limit": { "context": 131072, - "output": 131072 + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.2, - "output": 0.8 - }, - "type": "chat" - }, + "input": 0.08, + "output": 0.3 + } + } + ] + }, + "huggingface": { + "id": "huggingface", + "name": "Hugging Face", + "display_name": "Hugging Face", + "api": "https://router.huggingface.co/v1", + "doc": "https://huggingface.co/docs/inference-providers", + "models": [ { - "id": "zai-org/GLM-4.5-Air", - "name": "GLM 4.5 Air", - "display_name": "GLM 4.5 Air", + "id": "moonshotai/Kimi-K2-Instruct", + "name": "Kimi-K2-Instruct", + "display_name": "Kimi-K2-Instruct", "modalities": { "input": [ "text" @@ -46866,7 +44882,7 @@ }, "limit": { "context": 131072, - "output": 131072 + "output": 16384 }, "temperature": true, "tool_call": true, @@ -46875,29 +44891,31 @@ }, "attachment": false, "open_weights": true, - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "knowledge": "2024-10", + "release_date": "2025-07-14", + "last_updated": "2025-07-14", "cost": { - "input": 0.1, - "output": 0.5 - }, - "type": "chat" + "input": 1, + "output": 3 + } }, { - "id": "deepseek-ai/DeepSeek-R1-0528", - "name": "DeepSeek R1 0528", - "display_name": "DeepSeek R1 0528", + "id": "moonshotai/Kimi-K2.5", + "name": "Kimi-K2.5", + "display_name": "Kimi-K2.5", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 75000, - "output": 163840 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -46905,20 +44923,21 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": false, - "release_date": "2025-08-23", - "last_updated": "2025-08-23", + "attachment": true, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-01-01", + "last_updated": "2026-01-01", "cost": { - "input": 0.5, - "output": 2.15 - }, - "type": "chat" + "input": 0.6, + "output": 3, + "cache_read": 0.1 + } }, { - "id": "deepseek-ai/DeepSeek-V3.1", - "name": "DeepSeek V3.1", - "display_name": "DeepSeek V3.1", + "id": "moonshotai/Kimi-K2-Instruct-0905", + "name": "Kimi-K2-Instruct-0905", + "display_name": "Kimi-K2-Instruct-0905", "modalities": { "input": [ "text" @@ -46928,29 +44947,28 @@ ] }, "limit": { - "context": 75000, - "output": 163840 + "context": 262144, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-08-23", - "last_updated": "2025-08-23", + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2025-09-04", + "last_updated": "2025-09-04", "cost": { - "input": 0.2, - "output": 0.8 - }, - "type": "chat" + "input": 1, + "output": 3 + } }, { - "id": "deepseek-ai/DeepSeek-V3-0324", - "name": "DeepSeek V3 0324", - "display_name": "DeepSeek V3 0324", + "id": "moonshotai/Kimi-K2-Thinking", + "name": "Kimi-K2-Thinking", + "display_name": "Kimi-K2-Thinking", "modalities": { "input": [ "text" @@ -46960,37 +44978,30 @@ ] }, "limit": { - "context": 75000, - "output": 163840 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2025-08-23", - "last_updated": "2025-08-23", + "open_weights": true, + "knowledge": "2024-08", + "release_date": "2025-11-06", + "last_updated": "2025-11-06", "cost": { - "input": 0.2, - "output": 0.8 - }, - "type": "chat" - } - ] - }, - "nano-gpt": { - "id": "nano-gpt", - "name": "NanoGPT", - "display_name": "NanoGPT", - "api": "https://nano-gpt.com/api/v1", - "doc": "https://docs.nano-gpt.com", - "models": [ + "input": 0.6, + "output": 2.5, + "cache_read": 0.15 + } + }, { - "id": "moonshotai/kimi-k2-thinking", - "name": "Kimi K2 Thinking", - "display_name": "Kimi K2 Thinking", + "id": "MiniMaxAI/MiniMax-M2.1", + "name": "MiniMax-M2.1", + "display_name": "MiniMax-M2.1", "modalities": { "input": [ "text" @@ -47000,8 +45011,8 @@ ] }, "limit": { - "context": 32768, - "output": 8192 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -47010,20 +45021,19 @@ "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2024-08", - "release_date": "2024-11-01", - "last_updated": "2025-12-24", + "open_weights": true, + "knowledge": "2025-10", + "release_date": "2025-12-23", + "last_updated": "2025-12-23", "cost": { - "input": 1, - "output": 2 - }, - "type": "chat" + "input": 0.3, + "output": 1.2 + } }, { - "id": "moonshotai/kimi-k2-instruct", - "name": "Kimi K2 Instruct", - "display_name": "Kimi K2 Instruct", + "id": "XiaomiMiMo/MiMo-V2-Flash", + "name": "MiMo-V2-Flash", + "display_name": "MiMo-V2-Flash", "modalities": { "input": [ "text" @@ -47033,29 +45043,29 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 262144, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-07-18", - "last_updated": "2025-12-24", + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2025-12-16", + "last_updated": "2025-12-16", "cost": { - "input": 1, - "output": 2 - }, - "type": "chat" + "input": 0.1, + "output": 0.3 + } }, { - "id": "nousresearch/hermes-4-405b:thinking", - "name": "Hermes 4 405b Thinking", - "display_name": "Hermes 4 405b Thinking", + "id": "Qwen/Qwen3-Embedding-8B", + "name": "Qwen 3 Embedding 8B", + "display_name": "Qwen 3 Embedding 8B", "modalities": { "input": [ "text" @@ -47065,29 +45075,28 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 32000, + "output": 4096 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2024-08-13", - "last_updated": "2025-12-24", + "knowledge": "2024-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 1, - "output": 2 - }, - "type": "chat" + "input": 0.01, + "output": 0 + } }, { - "id": "nvidia/llama-3_3-nemotron-super-49b-v1_5", - "name": "Llama 3 3 Nemotron Super 49B V1 5", - "display_name": "Llama 3 3 Nemotron Super 49B V1 5", + "id": "Qwen/Qwen3-Embedding-4B", + "name": "Qwen 3 Embedding 4B", + "display_name": "Qwen 3 Embedding 4B", "modalities": { "input": [ "text" @@ -47097,28 +45106,28 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 32000, + "output": 2048 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-08-08", - "last_updated": "2025-12-24", + "knowledge": "2024-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 1, - "output": 2 - }, - "type": "chat" + "input": 0.01, + "output": 0 + } }, { - "id": "deepseek/deepseek-v3.2:thinking", - "name": "Deepseek V3.2 Thinking", - "display_name": "Deepseek V3.2 Thinking", + "id": "Qwen/Qwen3-Coder-480B-A35B-Instruct", + "name": "Qwen3-Coder-480B-A35B-Instruct", + "display_name": "Qwen3-Coder-480B-A35B-Instruct", "modalities": { "input": [ "text" @@ -47128,29 +45137,28 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 262144, + "output": 66536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-12-01", - "last_updated": "2025-12-24", + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", "cost": { - "input": 1, + "input": 2, "output": 2 - }, - "type": "chat" + } }, { - "id": "deepseek/deepseek-r1", - "name": "Deepseek R1", - "display_name": "Deepseek R1", + "id": "Qwen/Qwen3-235B-A22B-Thinking-2507", + "name": "Qwen3-235B-A22B-Thinking-2507", + "display_name": "Qwen3-235B-A22B-Thinking-2507", "modalities": { "input": [ "text" @@ -47160,8 +45168,8 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 262144, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -47171,19 +45179,18 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-01-20", - "last_updated": "2025-12-24", + "knowledge": "2025-04", + "release_date": "2025-07-25", + "last_updated": "2025-07-25", "cost": { - "input": 1, - "output": 2 - }, - "type": "chat" + "input": 0.3, + "output": 3 + } }, { - "id": "minimax/minimax-m2.1", - "name": "Minimax M2.1", - "display_name": "Minimax M2.1", + "id": "Qwen/Qwen3-Next-80B-A3B-Instruct", + "name": "Qwen3-Next-80B-A3B-Instruct", + "display_name": "Qwen3-Next-80B-A3B-Instruct", "modalities": { "input": [ "text" @@ -47193,8 +45200,8 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 262144, + "output": 66536 }, "temperature": true, "tool_call": true, @@ -47202,19 +45209,19 @@ "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-12-23", - "last_updated": "2025-12-24", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-09-11", + "last_updated": "2025-09-11", "cost": { - "input": 1, - "output": 2 - }, - "type": "chat" + "input": 0.25, + "output": 1 + } }, { - "id": "openai/gpt-oss-120b", - "name": "GPT Oss 120b", - "display_name": "GPT Oss 120b", + "id": "Qwen/Qwen3-Next-80B-A3B-Thinking", + "name": "Qwen3-Next-80B-A3B-Thinking", + "display_name": "Qwen3-Next-80B-A3B-Thinking", "modalities": { "input": [ "text" @@ -47224,8 +45231,8 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 262144, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -47233,20 +45240,19 @@ "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-06-23", - "last_updated": "2025-12-24", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-09-11", + "last_updated": "2025-09-11", "cost": { - "input": 1, + "input": 0.3, "output": 2 - }, - "type": "chat" + } }, { - "id": "z-ai/glm-4.6:thinking", - "name": "GLM 4.6 Thinking", - "display_name": "GLM 4.6 Thinking", + "id": "zai-org/GLM-4.7", + "name": "GLM-4.7", + "display_name": "GLM-4.7", "modalities": { "input": [ "text" @@ -47256,8 +45262,8 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -47267,18 +45273,19 @@ }, "attachment": false, "open_weights": true, - "release_date": "2025-04-07", - "last_updated": "2025-12-24", + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "cost": { - "input": 1, - "output": 2 - }, - "type": "chat" + "input": 0.6, + "output": 2.2, + "cache_read": 0.11 + } }, { - "id": "z-ai/glm-4.6", - "name": "GLM 4.6", - "display_name": "GLM 4.6", + "id": "zai-org/GLM-4.7-Flash", + "name": "GLM-4.7-Flash", + "display_name": "GLM-4.7-Flash", "modalities": { "input": [ "text" @@ -47289,28 +45296,28 @@ }, "limit": { "context": 200000, - "output": 8192 + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "knowledge": "2024-10", - "release_date": "2024-11-15", - "last_updated": "2025-12-24", + "knowledge": "2025-04", + "release_date": "2025-08-08", + "last_updated": "2025-08-08", "cost": { - "input": 1, - "output": 2 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "qwen/qwen3-coder", - "name": "Qwen3 Coder", - "display_name": "Qwen3 Coder", + "id": "deepseek-ai/DeepSeek-R1-0528", + "name": "DeepSeek-R1-0528", + "display_name": "DeepSeek-R1-0528", "modalities": { "input": [ "text" @@ -47320,29 +45327,29 @@ ] }, "limit": { - "context": 106000, - "output": 8192 + "context": 163840, + "output": 163840 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-01-15", - "last_updated": "2025-12-24", + "knowledge": "2025-05", + "release_date": "2025-05-28", + "last_updated": "2025-05-28", "cost": { - "input": 1, - "output": 2 - }, - "type": "chat" + "input": 3, + "output": 5 + } }, { - "id": "qwen/qwen3-235b-a22b-thinking-2507", - "name": "Qwen3 235B A22B Thinking 2507", - "display_name": "Qwen3 235B A22B Thinking 2507", + "id": "deepseek-ai/DeepSeek-V3.2", + "name": "DeepSeek-V3.2", + "display_name": "DeepSeek-V3.2", "modalities": { "input": [ "text" @@ -47352,8 +45359,8 @@ ] }, "limit": { - "context": 262144, - "output": 8192 + "context": 163840, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -47363,19 +45370,27 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-07-01", - "last_updated": "2025-12-24", + "knowledge": "2024-07", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "cost": { - "input": 1, - "output": 2 - }, - "type": "chat" - }, + "input": 0.28, + "output": 0.4 + } + } + ] + }, + "opencode": { + "id": "opencode", + "name": "OpenCode Zen", + "display_name": "OpenCode Zen", + "api": "https://opencode.ai/zen/v1", + "doc": "https://opencode.ai/docs/zen", + "models": [ { - "id": "mistralai/devstral-2-123b-instruct-2512", - "name": "Devstral 2 123b Instruct 2512", - "display_name": "Devstral 2 123b Instruct 2512", + "id": "glm-4.7", + "name": "GLM-4.7", + "display_name": "GLM-4.7", "modalities": { "input": [ "text" @@ -47385,28 +45400,30 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "release_date": "2025-12-11", - "last_updated": "2025-12-24", + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "cost": { - "input": 1, - "output": 2 - }, - "type": "chat" + "input": 0.6, + "output": 2.2, + "cache_read": 0.1 + } }, { - "id": "mistralai/mistral-large-3-675b-instruct-2512", - "name": "Mistral Large 3 675b Instruct 2512", - "display_name": "Mistral Large 3 675b Instruct 2512", + "id": "qwen3-coder", + "name": "Qwen3 Coder", + "display_name": "Qwen3 Coder", "modalities": { "input": [ "text" @@ -47416,8 +45433,8 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -47426,51 +45443,54 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2025-12-02", - "last_updated": "2025-12-24", + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", "cost": { - "input": 1, - "output": 2 - }, - "type": "chat" + "input": 0.45, + "output": 1.8 + } }, { - "id": "mistralai/ministral-14b-instruct-2512", - "name": "Ministral 14b Instruct 2512", - "display_name": "Ministral 14b Instruct 2512", + "id": "claude-opus-4-1", + "name": "Claude Opus 4.1", + "display_name": "Claude Opus 4.1", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 200000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-12", - "release_date": "2025-12-01", - "last_updated": "2025-12-24", + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 1, - "output": 2 - }, - "type": "chat" + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 + } }, { - "id": "meta-llama/llama-4-maverick", - "name": "Llama 4 Maverick", - "display_name": "Llama 4 Maverick", + "id": "kimi-k2", + "name": "Kimi K2", + "display_name": "Kimi K2", "modalities": { "input": [ "text" @@ -47480,8 +45500,8 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -47490,126 +45510,137 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2025-04-05", - "last_updated": "2025-12-24", + "knowledge": "2024-10", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", "cost": { - "input": 1, - "output": 2 - }, - "type": "chat" + "input": 0.4, + "output": 2.5, + "cache_read": 0.4 + } }, { - "id": "meta-llama/llama-3.3-70b-instruct", - "name": "Llama 3.3 70b Instruct", - "display_name": "Llama 3.3 70b Instruct", + "id": "gpt-5.2-codex", + "name": "GPT-5.2 Codex", + "display_name": "GPT-5.2 Codex", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-12-06", - "last_updated": "2025-12-24", + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-01-14", + "last_updated": "2026-01-14", "cost": { - "input": 1, - "output": 2 - }, - "type": "chat" + "input": 1.75, + "output": 14, + "cache_read": 0.175 + } }, { - "id": "zai-org/glm-4.7", - "name": "GLM 4.7", - "display_name": "GLM 4.7", + "id": "gpt-5.1-codex", + "name": "GPT-5.1 Codex", + "display_name": "GPT-5.1 Codex", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 8192 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-22", - "last_updated": "2025-12-24", + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 1, - "output": 2 - }, - "type": "chat" + "input": 1.07, + "output": 8.5, + "cache_read": 0.107 + } }, { - "id": "zai-org/glm-4.5-air", - "name": "GLM 4.5 Air", - "display_name": "GLM 4.5 Air", + "id": "claude-haiku-4-5", + "name": "Claude Haiku 4.5", + "display_name": "Claude Haiku 4.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-28", - "last_updated": "2025-12-24", + "attachment": true, + "open_weights": false, + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "cost": { "input": 1, - "output": 2 - }, - "type": "chat" + "output": 5, + "cache_read": 0.1, + "cache_write": 1.25 + } }, { - "id": "zai-org/glm-4.7:thinking", - "name": "GLM 4.7 Thinking", - "display_name": "GLM 4.7 Thinking", + "id": "claude-opus-4-6", + "name": "Claude Opus 4.6", + "display_name": "Claude Opus 4.6", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 1000000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -47617,20 +45648,28 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-04-07", - "last_updated": "2025-12-24", + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", "cost": { - "input": 1, - "output": 2 - }, - "type": "chat" + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25, + "context_over_200k": { + "input": 10, + "output": 37.5, + "cache_read": 1, + "cache_write": 12.5 + } + } }, { - "id": "zai-org/glm-4.5-air:thinking", - "name": "GLM 4.5 Air Thinking", - "display_name": "GLM 4.5 Air Thinking", + "id": "trinity-large-preview-free", + "name": "Trinity Large Preview", + "display_name": "Trinity Large Preview", "modalities": { "input": [ "text" @@ -47640,49 +45679,41 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-04-07", - "last_updated": "2025-12-24", + "knowledge": "2025-06", + "release_date": "2026-01-28", + "last_updated": "2026-01-28", "cost": { - "input": 1, - "output": 2 - }, - "type": "chat" - } - ] - }, - "zai": { - "id": "zai", - "name": "Z.AI", - "display_name": "Z.AI", - "api": "https://api.z.ai/api/paas/v4", - "doc": "https://docs.z.ai/guides/overview/pricing", - "models": [ + "input": 0, + "output": 0 + } + }, { - "id": "glm-4.7", - "name": "GLM-4.7", - "display_name": "GLM-4.7", + "id": "claude-opus-4-5", + "name": "Claude Opus 4.5", + "display_name": "Claude Opus 4.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -47690,34 +45721,35 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-22", - "last_updated": "2025-12-22", + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-11-24", + "last_updated": "2025-11-24", "cost": { - "input": 0.6, - "output": 2.2, - "cache_read": 0.11, - "cache_write": 0 - }, - "type": "chat" + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 + } }, { - "id": "glm-4.5-flash", - "name": "GLM-4.5-Flash", - "display_name": "GLM-4.5-Flash", + "id": "kimi-k2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 98304 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -47725,34 +45757,36 @@ "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "knowledge": "2024-10", + "release_date": "2026-01-27", + "last_updated": "2026-01-27", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 - }, - "type": "chat" + "input": 0.6, + "output": 3, + "cache_read": 0.08 + } }, { - "id": "glm-4.5", - "name": "GLM-4.5", - "display_name": "GLM-4.5", + "id": "gemini-3-pro", + "name": "Gemini 3 Pro", + "display_name": "Gemini 3 Pro", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 98304 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -47760,34 +45794,39 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", "cost": { - "input": 0.6, - "output": 2.2, - "cache_read": 0.11, - "cache_write": 0 - }, - "type": "chat" + "input": 2, + "output": 12, + "cache_read": 0.2, + "context_over_200k": { + "input": 4, + "output": 18, + "cache_read": 0.4 + } + } }, { - "id": "glm-4.5-air", - "name": "GLM-4.5-Air", - "display_name": "GLM-4.5-Air", + "id": "claude-sonnet-4-5", + "name": "Claude Sonnet 4.5", + "display_name": "Claude Sonnet 4.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 98304 + "context": 1000000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -47795,58 +45834,62 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", - "cost": { - "input": 0.2, - "output": 1.1, - "cache_read": 0.03, - "cache_write": 0 - }, - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", + "cost": { + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75, + "context_over_200k": { + "input": 6, + "output": 22.5, + "cache_read": 0.6, + "cache_write": 7.5 + } + } }, { - "id": "glm-4.5v", - "name": "GLM-4.5V", - "display_name": "GLM-4.5V", + "id": "gpt-5.1-codex-mini", + "name": "GPT-5.1 Codex Mini", + "display_name": "GPT-5.1 Codex Mini", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 64000, - "output": 16384 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, "attachment": true, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-08-11", - "last_updated": "2025-08-11", + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.6, - "output": 1.8 - }, - "type": "chat" + "input": 0.25, + "output": 2, + "cache_read": 0.025 + } }, { - "id": "glm-4.6", - "name": "GLM-4.6", - "display_name": "GLM-4.6", + "id": "kimi-k2-thinking", + "name": "Kimi K2 Thinking", + "display_name": "Kimi K2 Thinking", "modalities": { "input": [ "text" @@ -47856,8 +45899,8 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -47867,97 +45910,87 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-09-30", - "last_updated": "2025-09-30", + "knowledge": "2024-10", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", "cost": { - "input": 0.6, - "output": 2.2, - "cache_read": 0.11, - "cache_write": 0 - }, - "type": "chat" + "input": 0.4, + "output": 2.5, + "cache_read": 0.4 + } }, { - "id": "glm-4.6v", - "name": "GLM-4.6V", - "display_name": "GLM-4.6V", + "id": "gpt-5.1", + "name": "GPT-5.1", + "display_name": "GPT-5.1", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, "attachment": true, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-08", - "last_updated": "2025-12-08", + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.3, - "output": 0.9 - }, - "type": "chat" - } - ] - }, - "inference": { - "id": "inference", - "name": "Inference", - "display_name": "Inference", - "api": "https://inference.net/v1", - "doc": "https://inference.net/models", - "models": [ + "input": 1.07, + "output": 8.5, + "cache_read": 0.107 + } + }, { - "id": "mistral/mistral-nemo-12b-instruct", - "name": "Mistral Nemo 12B Instruct", - "display_name": "Mistral Nemo 12B Instruct", + "id": "gpt-5-nano", + "name": "GPT-5 Nano", + "display_name": "GPT-5 Nano", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 16000, - "output": 4096 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "attachment": true, + "open_weights": false, + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.038, - "output": 0.1 - }, - "type": "chat" + "input": 0, + "output": 0, + "cache_read": 0 + } }, { - "id": "google/gemma-3", - "name": "Google Gemma 3", - "display_name": "Google Gemma 3", + "id": "gpt-5-codex", + "name": "GPT-5 Codex", + "display_name": "GPT-5 Codex", "modalities": { "input": [ "text", @@ -47968,29 +46001,30 @@ ] }, "limit": { - "context": 125000, - "output": 4096 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, - "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-09-15", + "last_updated": "2025-09-15", "cost": { - "input": 0.15, - "output": 0.3 - }, - "type": "chat" + "input": 1.07, + "output": 8.5, + "cache_read": 0.107 + } }, { - "id": "osmosis/osmosis-structure-0.6b", - "name": "Osmosis Structure 0.6B", - "display_name": "Osmosis Structure 0.6B", + "id": "big-pickle", + "name": "Big Pickle", + "display_name": "Big Pickle", "modalities": { "input": [ "text" @@ -48000,73 +46034,44 @@ ] }, "limit": { - "context": 4000, - "output": 2048 + "context": 200000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", - "cost": { - "input": 0.1, - "output": 0.5 - }, - "type": "chat" - }, - { - "id": "qwen/qwen3-embedding-4b", - "name": "Qwen 3 Embedding 4B", - "display_name": "Qwen 3 Embedding 4B", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 32000, - "output": 2048 - }, - "temperature": false, - "tool_call": false, - "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-10-17", + "last_updated": "2025-10-17", "cost": { - "input": 0.01, - "output": 0 - }, - "type": "embedding" + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 + } }, { - "id": "qwen/qwen-2.5-7b-vision-instruct", - "name": "Qwen 2.5 7B Vision Instruct", - "display_name": "Qwen 2.5 7B Vision Instruct", + "id": "claude-3-5-haiku", + "name": "Claude Haiku 3.5", + "display_name": "Claude Haiku 3.5", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 125000, - "output": 4096 + "context": 200000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -48074,53 +46079,54 @@ "supported": false }, "attachment": true, - "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "open_weights": false, + "knowledge": "2024-07-31", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", "cost": { - "input": 0.2, - "output": 0.2 - }, - "type": "chat" + "input": 0.8, + "output": 4, + "cache_read": 0.08, + "cache_write": 1 + } }, { - "id": "meta/llama-3.2-11b-vision-instruct", - "name": "Llama 3.2 11B Vision Instruct", - "display_name": "Llama 3.2 11B Vision Instruct", + "id": "glm-4.6", + "name": "GLM-4.6", + "display_name": "GLM-4.6", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 16000, - "output": 4096 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "knowledge": "2025-04", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", "cost": { - "input": 0.055, - "output": 0.055 - }, - "type": "chat" + "input": 0.6, + "output": 2.2, + "cache_read": 0.1 + } }, { - "id": "meta/llama-3.1-8b-instruct", - "name": "Llama 3.1 8B Instruct", - "display_name": "Llama 3.1 8B Instruct", + "id": "glm-4.7-free", + "name": "GLM-4.7 Free", + "display_name": "GLM-4.7 Free", "modalities": { "input": [ "text" @@ -48130,29 +46136,30 @@ ] }, "limit": { - "context": 16000, - "output": 4096 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "cost": { - "input": 0.025, - "output": 0.025 - }, - "type": "chat" + "input": 0, + "output": 0, + "cache_read": 0 + } }, { - "id": "meta/llama-3.2-3b-instruct", - "name": "Llama 3.2 3B Instruct", - "display_name": "Llama 3.2 3B Instruct", + "id": "grok-code", + "name": "Grok Code Fast 1", + "display_name": "Grok Code Fast 1", "modalities": { "input": [ "text" @@ -48162,70 +46169,67 @@ ] }, "limit": { - "context": 16000, - "output": 4096 + "context": 256000, + "output": 256000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "attachment": true, + "open_weights": false, + "release_date": "2025-08-20", + "last_updated": "2025-08-20", "cost": { - "input": 0.02, - "output": 0.02 - }, - "type": "chat" + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 + } }, { - "id": "meta/llama-3.2-1b-instruct", - "name": "Llama 3.2 1B Instruct", - "display_name": "Llama 3.2 1B Instruct", + "id": "gemini-3-flash", + "name": "Gemini 3 Flash", + "display_name": "Gemini 3 Flash", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 16000, - "output": 4096 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", "cost": { - "input": 0.01, - "output": 0.01 - }, - "type": "chat" - } - ] - }, - "requesty": { - "id": "requesty", - "name": "Requesty", - "display_name": "Requesty", - "api": "https://router.requesty.ai/v1", - "doc": "https://requesty.ai/solution/llm-routing/models", - "models": [ + "input": 0.5, + "output": 3, + "cache_read": 0.05 + } + }, { - "id": "xai/grok-4", - "name": "Grok 4", - "display_name": "Grok 4", + "id": "gpt-5.1-codex-max", + "name": "GPT-5.1 Codex Max", + "display_name": "GPT-5.1 Codex Max", "modalities": { "input": [ "text", @@ -48236,10 +46240,10 @@ ] }, "limit": { - "context": 256000, - "output": 64000 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -48247,21 +46251,19 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-09-09", - "last_updated": "2025-09-09", + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.75, - "cache_write": 3 - }, - "type": "chat" + "input": 1.25, + "output": 10, + "cache_read": 0.125 + } }, { - "id": "xai/grok-4-fast", - "name": "Grok 4 Fast", - "display_name": "Grok 4 Fast", + "id": "minimax-m2.1-free", + "name": "MiniMax M2.1 Free", + "display_name": "MiniMax M2.1 Free", "modalities": { "input": [ "text" @@ -48271,8 +46273,8 @@ ] }, "limit": { - "context": 2000000, - "output": 64000 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -48280,38 +46282,34 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, + "attachment": false, + "open_weights": true, "knowledge": "2025-01", - "release_date": "2025-09-19", - "last_updated": "2025-09-19", + "release_date": "2025-12-23", + "last_updated": "2025-12-23", "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05, - "cache_write": 0.2 - }, - "type": "chat" + "input": 0, + "output": 0, + "cache_read": 0 + } }, { - "id": "google/gemini-3-flash-preview", - "name": "Gemini 3 Flash", - "display_name": "Gemini 3 Flash", + "id": "kimi-k2.5-free", + "name": "Kimi K2.5 Free", + "display_name": "Kimi K2.5 Free", "modalities": { "input": [ "text", "image", - "audio", - "video", - "pdf" + "video" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -48320,28 +46318,24 @@ "default": true }, "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-12-17", - "last_updated": "2025-12-17", + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2026-01-27", + "last_updated": "2026-01-27", "cost": { - "input": 0.5, - "output": 3, - "cache_read": 0.05, - "cache_write": 1 - }, - "type": "chat" + "input": 0, + "output": 0, + "cache_read": 0 + } }, { - "id": "google/gemini-3-pro-preview", - "name": "Gemini 3 Pro", - "display_name": "Gemini 3 Pro", + "id": "claude-sonnet-4", + "name": "Claude Sonnet 4", + "display_name": "Claude Sonnet 4", "modalities": { "input": [ "text", "image", - "audio", - "video", "pdf" ], "output": [ @@ -48349,8 +46343,8 @@ ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 1000000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -48360,38 +46354,40 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-11-18", - "last_updated": "2025-11-18", - "cost": { - "input": 2, - "output": 12, - "cache_read": 0.2, - "cache_write": 4.5 - }, - "type": "chat" + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", + "cost": { + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75, + "context_over_200k": { + "input": 6, + "output": 22.5, + "cache_read": 0.6, + "cache_write": 7.5 + } + } }, { - "id": "google/gemini-2.5-flash", - "name": "Gemini 2.5 Flash", - "display_name": "Gemini 2.5 Flash", + "id": "gpt-5", + "name": "GPT-5", + "display_name": "GPT-5", "modalities": { "input": [ "text", - "image", - "audio", - "video", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -48399,36 +46395,30 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-06-17", - "last_updated": "2025-06-17", + "knowledge": "2024-09-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.3, - "output": 2.5, - "cache_read": 0.075, - "cache_write": 0.55 - }, - "type": "chat" + "input": 1.07, + "output": 8.5, + "cache_read": 0.107 + } }, { - "id": "google/gemini-2.5-pro", - "name": "Gemini 2.5 Pro", - "display_name": "Gemini 2.5 Pro", + "id": "minimax-m2.1", + "name": "MiniMax M2.1", + "display_name": "MiniMax M2.1", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -48436,23 +46426,21 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, + "attachment": false, + "open_weights": true, "knowledge": "2025-01", - "release_date": "2025-06-17", - "last_updated": "2025-06-17", + "release_date": "2025-12-23", + "last_updated": "2025-12-23", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.31, - "cache_write": 2.375 - }, - "type": "chat" + "input": 0.3, + "output": 1.2, + "cache_read": 0.1 + } }, { - "id": "openai/gpt-4.1-mini", - "name": "GPT-4.1 Mini", - "display_name": "GPT-4.1 Mini", + "id": "gpt-5.2", + "name": "GPT-5.2", + "display_name": "GPT-5.2", "modalities": { "input": [ "text", @@ -48463,30 +46451,70 @@ ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 0.4, - "output": 1.6, - "cache_read": 0.1 + "input": 1.75, + "output": 14, + "cache_read": 0.175 + } + } + ] + }, + "fastrouter": { + "id": "fastrouter", + "name": "FastRouter", + "display_name": "FastRouter", + "api": "https://go.fastrouter.ai/api/v1", + "doc": "https://fastrouter.ai/models", + "models": [ + { + "id": "moonshotai/kimi-k2", + "name": "Kimi K2", + "display_name": "Kimi K2", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] }, - "type": "chat" + "limit": { + "context": 131072, + "output": 32768 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2025-07-11", + "last_updated": "2025-07-11", + "cost": { + "input": 0.55, + "output": 2.2 + } }, { - "id": "openai/gpt-5-nano", - "name": "GPT-5 Nano", - "display_name": "GPT-5 Nano", + "id": "x-ai/grok-4", + "name": "Grok 4", + "display_name": "Grok 4", "modalities": { "input": [ "text" @@ -48496,77 +46524,79 @@ ] }, "limit": { - "context": 16000, - "output": 4000 + "context": 256000, + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "knowledge": "2025-07", + "release_date": "2025-07-09", + "last_updated": "2025-07-09", "cost": { - "input": 0.05, - "output": 0.4, - "cache_read": 0.01 - }, - "type": "chat" + "input": 3, + "output": 15, + "cache_read": 0.75, + "cache_write": 15 + } }, { - "id": "openai/gpt-4.1", - "name": "GPT-4.1", - "display_name": "GPT-4.1", + "id": "google/gemini-2.5-flash", + "name": "Gemini 2.5 Flash", + "display_name": "Gemini 2.5 Flash", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "knowledge": "2025-01", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", "cost": { - "input": 2, - "output": 8, - "cache_read": 0.5 - }, - "type": "chat" + "input": 0.3, + "output": 2.5, + "cache_read": 0.0375 + } }, { - "id": "openai/o4-mini", - "name": "o4 Mini", - "display_name": "o4 Mini", + "id": "google/gemini-2.5-pro", + "name": "Gemini 2.5 Pro", + "display_name": "Gemini 2.5 Pro", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -48576,20 +46606,19 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-06", - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "knowledge": "2025-01", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.28 - }, - "type": "chat" + "input": 1.25, + "output": 10, + "cache_read": 0.31 + } }, { - "id": "openai/gpt-5-mini", - "name": "GPT-5 Mini", - "display_name": "GPT-5 Mini", + "id": "openai/gpt-5-nano", + "name": "GPT-5 Nano", + "display_name": "GPT-5 Nano", "modalities": { "input": [ "text", @@ -48600,10 +46629,10 @@ ] }, "limit": { - "context": 128000, - "output": 32000 + "context": 400000, + "output": 128000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -48611,20 +46640,19 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-05-30", + "knowledge": "2024-10-01", "release_date": "2025-08-07", "last_updated": "2025-08-07", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.03 - }, - "type": "chat" + "input": 0.05, + "output": 0.4, + "cache_read": 0.005 + } }, { - "id": "openai/gpt-4o-mini", - "name": "GPT-4o Mini", - "display_name": "GPT-4o Mini", + "id": "openai/gpt-4.1", + "name": "GPT-4.1", + "display_name": "GPT-4.1", "modalities": { "input": [ "text", @@ -48635,8 +46663,8 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 1047576, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -48645,38 +46673,33 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-07-18", - "last_updated": "2024-07-18", + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.15, - "output": 0.6, - "cache_read": 0.08 - }, - "type": "chat" + "input": 2, + "output": 8, + "cache_read": 0.5 + } }, { - "id": "openai/gpt-5", - "name": "GPT-5", - "display_name": "GPT-5", + "id": "openai/gpt-5-mini", + "name": "GPT-5 Mini", + "display_name": "GPT-5 Mini", "modalities": { "input": [ "text", - "audio", - "image", - "video" + "image" ], "output": [ - "text", - "audio", - "image" + "text" ] }, "limit": { "context": 400000, "output": 128000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -48684,33 +46707,30 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", + "knowledge": "2024-10-01", "release_date": "2025-08-07", "last_updated": "2025-08-07", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.13 - }, - "type": "chat" + "input": 0.25, + "output": 2, + "cache_read": 0.025 + } }, { - "id": "anthropic/claude-opus-4", - "name": "Claude Opus 4", - "display_name": "Claude Opus 4", + "id": "openai/gpt-oss-20b", + "name": "GPT OSS 20B", + "display_name": "GPT OSS 20B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 131072, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -48718,36 +46738,30 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "attachment": false, + "open_weights": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 - }, - "type": "chat" + "input": 0.05, + "output": 0.2 + } }, { - "id": "anthropic/claude-opus-4-1", - "name": "Claude Opus 4.1", - "display_name": "Claude Opus 4.1", + "id": "openai/gpt-oss-120b", + "name": "GPT OSS 120B", + "display_name": "GPT OSS 120B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -48755,36 +46769,31 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", + "attachment": false, + "open_weights": true, "release_date": "2025-08-05", "last_updated": "2025-08-05", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 - }, - "type": "chat" + "input": 0.15, + "output": 0.6 + } }, { - "id": "anthropic/claude-haiku-4-5", - "name": "Claude Haiku 4.5", - "display_name": "Claude Haiku 4.5", + "id": "openai/gpt-5", + "name": "GPT-5", + "display_name": "GPT-5", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 62000 + "context": 400000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -48794,58 +46803,50 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-02-01", - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "knowledge": "2024-10-01", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 1, - "output": 5, - "cache_read": 0.1, - "cache_write": 1.25 - }, - "type": "chat" + "input": 1.25, + "output": 10, + "cache_read": 0.125 + } }, { - "id": "anthropic/claude-opus-4-5", - "name": "Claude Opus 4.5", - "display_name": "Claude Opus 4.5", + "id": "qwen/qwen3-coder", + "name": "Qwen3 Coder", + "display_name": "Qwen3 Coder", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 262144, + "output": 66536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-11-24", - "last_updated": "2025-11-24", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 - }, - "type": "chat" + "input": 0.3, + "output": 1.2 + } }, { - "id": "anthropic/claude-sonnet-4-5", - "name": "Claude Sonnet 4.5", - "display_name": "Claude Sonnet 4.5", + "id": "anthropic/claude-opus-4.1", + "name": "Claude Opus 4.1", + "display_name": "Claude Opus 4.1", "modalities": { "input": [ "text", @@ -48857,8 +46858,8 @@ ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 200000, + "output": 32000 }, "temperature": true, "tool_call": true, @@ -48868,21 +46869,20 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "knowledge": "2025-03-31", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 - }, - "type": "chat" + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 + } }, { - "id": "anthropic/claude-3-7-sonnet", - "name": "Claude Sonnet 3.7", - "display_name": "Claude Sonnet 3.7", + "id": "anthropic/claude-sonnet-4", + "name": "Claude Sonnet 4", + "display_name": "Claude Sonnet 4", "modalities": { "input": [ "text", @@ -48905,67 +46905,61 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-01", - "release_date": "2025-02-19", - "last_updated": "2025-02-19", + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { "input": 3, "output": 15, "cache_read": 0.3, "cache_write": 3.75 - }, - "type": "chat" + } }, { - "id": "anthropic/claude-sonnet-4", - "name": "Claude Sonnet 4", - "display_name": "Claude Sonnet 4", + "id": "deepseek-ai/deepseek-r1-distill-llama-70b", + "name": "DeepSeek R1 Distill Llama 70B", + "display_name": "DeepSeek R1 Distill Llama 70B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 131072, + "output": 131072 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "attachment": false, + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2025-01-23", + "last_updated": "2025-01-23", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 - }, - "type": "chat" + "input": 0.03, + "output": 0.14 + } } ] }, - "morph": { - "id": "morph", - "name": "Morph", - "display_name": "Morph", - "api": "https://api.morphllm.com/v1", - "doc": "https://docs.morphllm.com/api-reference/introduction", + "minimax": { + "id": "minimax", + "name": "MiniMax (minimax.io)", + "display_name": "MiniMax (minimax.io)", + "api": "https://api.minimax.io/anthropic/v1", + "doc": "https://platform.minimax.io/docs/guides/quickstart", "models": [ { - "id": "morph-v3-large", - "name": "Morph v3 Large", - "display_name": "Morph v3 Large", + "id": "MiniMax-M2", + "name": "MiniMax-M2", + "display_name": "MiniMax-M2", "modalities": { "input": [ "text" @@ -48975,28 +46969,28 @@ ] }, "limit": { - "context": 32000, - "output": 32000 + "context": 196608, + "output": 128000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2024-08-15", - "last_updated": "2024-08-15", + "open_weights": true, + "release_date": "2025-10-27", + "last_updated": "2025-10-27", "cost": { - "input": 0.9, - "output": 1.9 - }, - "type": "chat" + "input": 0.3, + "output": 1.2 + } }, { - "id": "auto", - "name": "Auto", - "display_name": "Auto", + "id": "MiniMax-M2.1", + "name": "MiniMax-M2.1", + "display_name": "MiniMax-M2.1", "modalities": { "input": [ "text" @@ -49006,28 +47000,36 @@ ] }, "limit": { - "context": 32000, - "output": 32000 + "context": 204800, + "output": 131072 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2024-06-01", - "last_updated": "2024-06-01", + "open_weights": true, + "release_date": "2025-12-23", + "last_updated": "2025-12-23", "cost": { - "input": 0.85, - "output": 1.55 - }, - "type": "chat" - }, + "input": 0.3, + "output": 1.2 + } + } + ] + }, + "google": { + "id": "google", + "name": "google", + "display_name": "google", + "doc": "https://ai.google.dev/gemini-api/docs/pricing", + "models": [ { - "id": "morph-v3-fast", - "name": "Morph v3 Fast", - "display_name": "Morph v3 Fast", + "id": "gemini-embedding-001", + "name": "Gemini Embedding 001", + "display_name": "Gemini Embedding 001", "modalities": { "input": [ "text" @@ -49037,8 +47039,8 @@ ] }, "limit": { - "context": 16000, - "output": 16000 + "context": 2048, + "output": 3072 }, "temperature": false, "tool_call": false, @@ -49047,38 +47049,33 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-08-15", - "last_updated": "2024-08-15", + "knowledge": "2025-05", + "release_date": "2025-05-20", + "last_updated": "2025-05-20", "cost": { - "input": 0.8, - "output": 1.2 - }, - "type": "chat" - } - ] - }, - "lmstudio": { - "id": "lmstudio", - "name": "LMStudio", - "display_name": "LMStudio", - "api": "http://127.0.0.1:1234/v1", - "doc": "https://lmstudio.ai/models", - "models": [ + "input": 0.15, + "output": 0 + } + }, { - "id": "openai/gpt-oss-20b", - "name": "GPT OSS 20B", - "display_name": "GPT OSS 20B", + "id": "gemini-3-flash-preview", + "name": "Gemini 3 Flash Preview", + "display_name": "Gemini 3 Flash Preview", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -49086,462 +47083,560 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.5, + "output": 3, + "cache_read": 0.05, + "context_over_200k": { + "input": 0.5, + "output": 3, + "cache_read": 0.05 + } + } }, { - "id": "qwen/qwen3-30b-a3b-2507", - "name": "Qwen3 30B A3B 2507", - "display_name": "Qwen3 30B A3B 2507", + "id": "gemini-2.5-flash-image", + "name": "Gemini 2.5 Flash Image", + "display_name": "Gemini 2.5 Flash Image", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "text" + "text", + "image" ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 32768, + "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-30", - "last_updated": "2025-07-30", + "open_weights": false, + "knowledge": "2025-06", + "release_date": "2025-08-26", + "last_updated": "2025-08-26", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.3, + "output": 30, + "cache_read": 0.075 + } }, { - "id": "qwen/qwen3-coder-30b", - "name": "Qwen3 Coder 30B", - "display_name": "Qwen3 Coder 30B", + "id": "gemini-2.5-flash-preview-05-20", + "name": "Gemini 2.5 Flash Preview 05-20", + "display_name": "Gemini 2.5 Flash Preview 05-20", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, + "context": 1048576, "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-23", - "last_updated": "2025-07-23", + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-05-20", + "last_updated": "2025-05-20", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" - } - ] - }, - "friendli": { - "id": "friendli", - "name": "Friendli", - "display_name": "Friendli", - "api": "https://api.friendli.ai/serverless/v1", - "doc": "https://friendli.ai/docs/guides/serverless_endpoints/introduction", - "models": [ + "input": 0.15, + "output": 0.6, + "cache_read": 0.0375 + } + }, { - "id": "meta-llama-3.3-70b-instruct", - "name": "Llama 3.3 70B Instruct", - "display_name": "Llama 3.3 70B Instruct", + "id": "gemini-flash-lite-latest", + "name": "Gemini Flash-Lite Latest", + "display_name": "Gemini Flash-Lite Latest", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2024-08-01", - "last_updated": "2025-12-23", + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-09-25", + "last_updated": "2025-09-25", "cost": { - "input": 0.6, - "output": 0.6 - }, - "type": "chat" + "input": 0.1, + "output": 0.4, + "cache_read": 0.025 + } }, { - "id": "meta-llama-3.1-8b-instruct", - "name": "Llama 3.1 8B Instruct", - "display_name": "Llama 3.1 8B Instruct", + "id": "gemini-3-pro-preview", + "name": "Gemini 3 Pro Preview", + "display_name": "Gemini 3 Pro Preview", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8000 + "context": 1000000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2024-08-01", - "last_updated": "2025-12-23", + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", "cost": { - "input": 0.1, - "output": 0.1 - }, - "type": "chat" + "input": 2, + "output": 12, + "cache_read": 0.2, + "context_over_200k": { + "input": 4, + "output": 18, + "cache_read": 0.4 + } + } }, { - "id": "LGAI-EXAONE/EXAONE-4.0.1-32B", - "name": "EXAONE 4.0.1 32B", - "display_name": "EXAONE 4.0.1 32B", + "id": "gemini-2.5-flash", + "name": "Gemini 2.5 Flash", + "display_name": "Gemini 2.5 Flash", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": true, + "budget": { + "default": -1, + "min": 0, + "max": 24576 + } }, - "attachment": false, - "open_weights": true, - "release_date": "2025-07-31", - "last_updated": "2025-12-23", - "cost": { - "input": 0.6, - "output": 1 + "search": { + "supported": true, + "default": false }, - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-06-05", + "cost": { + "input": 0.3, + "output": 2.5, + "cache_read": 0.075, + "input_audio": 1 + } }, { - "id": "meta-llama/Llama-4-Maverick-17B-128E-Instruct", - "name": "Llama 4 Maverick 17B 128E Instruct", - "display_name": "Llama 4 Maverick 17B 128E Instruct", + "id": "gemini-flash-latest", + "name": "Gemini Flash Latest", + "display_name": "Gemini Flash Latest", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8000 + "context": 1048576, + "output": 65536 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-06-16", - "last_updated": "2025-12-23", - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-09-25", + "last_updated": "2025-09-25", + "cost": { + "input": 0.3, + "output": 2.5, + "cache_read": 0.075, + "input_audio": 1 + } }, { - "id": "meta-llama/Llama-4-Scout-17B-16E-Instruct", - "name": "Llama 4 Scout 17B 16E Instruct", - "display_name": "Llama 4 Scout 17B 16E Instruct", + "id": "gemini-2.5-pro-preview-05-06", + "name": "Gemini 2.5 Pro Preview 05-06", + "display_name": "Gemini 2.5 Pro Preview 05-06", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8000 + "context": 1048576, + "output": 65536 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-06-16", - "last_updated": "2025-12-23", - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-05-06", + "last_updated": "2025-05-06", + "cost": { + "input": 1.25, + "output": 10, + "cache_read": 0.31 + } }, { - "id": "Qwen/Qwen3-30B-A3B", - "name": "Qwen3 30B A3B", - "display_name": "Qwen3 30B A3B", + "id": "gemini-2.5-flash-preview-tts", + "name": "Gemini 2.5 Flash Preview TTS", + "display_name": "Gemini 2.5 Flash Preview TTS", "modalities": { "input": [ "text" ], "output": [ - "text" + "audio" ] }, "limit": { - "context": 131072, - "output": 8000 + "context": 8000, + "output": 16000 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-06-16", - "last_updated": "2025-12-23", - "type": "chat" + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-05-01", + "last_updated": "2025-05-01", + "cost": { + "input": 0.5, + "output": 10 + } }, { - "id": "Qwen/Qwen3-235B-A22B-Instruct-2507", - "name": "Qwen3 235B A22B Instruct 2507", - "display_name": "Qwen3 235B A22B Instruct 2507", + "id": "gemini-2.0-flash-lite", + "name": "Gemini 2.0 Flash Lite", + "display_name": "Gemini 2.0 Flash Lite", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 1048576, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2025-07-29", - "last_updated": "2025-12-23", - "cost": { - "input": 0.2, - "output": 0.8 + "search": { + "supported": false }, - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2024-06", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", + "cost": { + "input": 0.075, + "output": 0.3 + } }, { - "id": "Qwen/Qwen3-32B", - "name": "Qwen3 32B", - "display_name": "Qwen3 32B", + "id": "gemini-live-2.5-flash-preview-native-audio", + "name": "Gemini Live 2.5 Flash Preview Native Audio", + "display_name": "Gemini Live 2.5 Flash Preview Native Audio", "modalities": { "input": [ - "text" + "text", + "audio", + "video" ], "output": [ - "text" + "text", + "audio" ] }, "limit": { "context": 131072, - "output": 8000 + "output": 65536 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, "attachment": false, - "open_weights": true, - "release_date": "2025-06-16", - "last_updated": "2025-12-23", - "type": "chat" - }, - { - "id": "Qwen/Qwen3-235B-A22B-Thinking-2507", - "name": "Qwen3 235B A22B Thinking 2507", - "display_name": "Qwen3 235B A22B Thinking 2507", + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-06-17", + "last_updated": "2025-09-18", + "cost": { + "input": 0.5, + "output": 2, + "input_audio": 3, + "output_audio": 12 + } + }, + { + "id": "gemini-2.0-flash", + "name": "Gemini 2.0 Flash", + "display_name": "Gemini 2.0 Flash", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 1048576, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, - "attachment": false, - "open_weights": true, - "release_date": "2025-07-29", - "last_updated": "2025-12-23", - "type": "chat" + "search": { + "supported": true, + "default": false + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-06", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", + "cost": { + "input": 0.1, + "output": 0.4, + "cache_read": 0.025 + } }, { - "id": "zai-org/GLM-4.6", - "name": "GLM 4.6", - "display_name": "GLM 4.6", + "id": "gemini-2.5-flash-lite", + "name": "Gemini 2.5 Flash Lite", + "display_name": "Gemini 2.5 Flash Lite", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false, + "budget": { + "default": -1, + "min": 512, + "max": 24576 + } }, - "attachment": false, - "open_weights": true, - "release_date": "2025-10-31", - "last_updated": "2025-12-23", - "type": "chat" + "search": { + "supported": true, + "default": false + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", + "cost": { + "input": 0.1, + "output": 0.4, + "cache_read": 0.025 + } }, { - "id": "deepseek-ai/DeepSeek-R1-0528", - "name": "DeepSeek R1 0528", - "display_name": "DeepSeek R1 0528", + "id": "gemini-2.5-pro-preview-06-05", + "name": "Gemini 2.5 Pro Preview 06-05", + "display_name": "Gemini 2.5 Pro Preview 06-05", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 163840, - "output": 163840 + "context": 1048576, + "output": 65536 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-07-11", - "last_updated": "2025-12-23", - "type": "chat" - } - ] - }, - "sap-ai-core": { - "id": "sap-ai-core", - "name": "SAP AI Core", - "display_name": "SAP AI Core", - "doc": "https://help.sap.com/docs/sap-ai-core", - "models": [ + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-06-05", + "last_updated": "2025-06-05", + "cost": { + "input": 1.25, + "output": 10, + "cache_read": 0.31 + } + }, { - "id": "anthropic--claude-3.5-sonnet", - "name": "anthropic--claude-3.5-sonnet", - "display_name": "anthropic--claude-3.5-sonnet", + "id": "gemini-live-2.5-flash", + "name": "Gemini Live 2.5 Flash", + "display_name": "Gemini Live 2.5 Flash", "modalities": { "input": [ "text", "image", - "pdf" + "audio", + "video" ], "output": [ - "text" + "text", + "audio" ] }, "limit": { - "context": 200000, - "output": 8192 + "context": 128000, + "output": 8000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2024-04-30", - "release_date": "2024-10-22", - "last_updated": "2024-10-22", + "knowledge": "2025-01", + "release_date": "2025-09-01", + "last_updated": "2025-09-01", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 - }, - "type": "chat" + "input": 0.5, + "output": 2, + "input_audio": 3, + "output_audio": 12 + } }, { - "id": "anthropic--claude-4.5-haiku", - "name": "anthropic--claude-4.5-haiku", - "display_name": "anthropic--claude-4.5-haiku", + "id": "gemini-2.5-flash-lite-preview-06-17", + "name": "Gemini 2.5 Flash Lite Preview 06-17", + "display_name": "Gemini 2.5 Flash Lite Preview 06-17", "modalities": { "input": [ "text", "image", + "audio", + "video", "pdf" ], "output": [ @@ -49549,8 +47644,8 @@ ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -49560,65 +47655,58 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-02-28", - "release_date": "2025-10-01", - "last_updated": "2025-10-01", + "knowledge": "2025-01", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", "cost": { - "input": 1, - "output": 5, - "cache_read": 0.1, - "cache_write": 1.25 - }, - "type": "chat" + "input": 0.1, + "output": 0.4, + "cache_read": 0.025, + "input_audio": 0.3 + } }, { - "id": "anthropic--claude-4-opus", - "name": "anthropic--claude-4-opus", - "display_name": "anthropic--claude-4-opus", + "id": "gemini-2.5-flash-image-preview", + "name": "Gemini 2.5 Flash Image Preview", + "display_name": "Gemini 2.5 Flash Image Preview", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ - "text" + "text", + "image" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 32768, + "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "knowledge": "2025-06", + "release_date": "2025-08-26", + "last_updated": "2025-08-26", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 - }, - "type": "chat" + "input": 0.3, + "output": 30, + "cache_read": 0.075 + } }, { - "id": "gemini-2.5-flash", - "name": "gemini-2.5-flash", - "display_name": "gemini-2.5-flash", + "id": "gemini-2.5-flash-preview-09-2025", + "name": "Gemini 2.5 Flash Preview 09 2025", + "display_name": "Gemini 2.5 Flash Preview 09 2025", "modalities": { "input": [ "text", - "image", - "audio", - "video", - "pdf" + "image" ], "output": [ "text" @@ -49632,29 +47720,39 @@ "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": true, + "budget": { + "default": -1, + "min": 0, + "max": 24576 + } + }, + "search": { + "supported": true, + "default": false }, "attachment": true, "open_weights": false, "knowledge": "2025-01", - "release_date": "2025-03-25", - "last_updated": "2025-06-05", + "release_date": "2025-09-25", + "last_updated": "2025-09-25", "cost": { "input": 0.3, "output": 2.5, "cache_read": 0.075, "input_audio": 1 - }, - "type": "chat" + } }, { - "id": "anthropic--claude-3-haiku", - "name": "anthropic--claude-3-haiku", - "display_name": "anthropic--claude-3-haiku", + "id": "gemini-2.5-flash-preview-04-17", + "name": "Gemini 2.5 Flash Preview 04-17", + "display_name": "Gemini 2.5 Flash Preview 04-17", "modalities": { "input": [ "text", "image", + "audio", + "video", "pdf" ], "output": [ @@ -49662,67 +47760,61 @@ ] }, "limit": { - "context": 200000, - "output": 4096 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2023-08-31", - "release_date": "2024-03-13", - "last_updated": "2024-03-13", + "knowledge": "2025-01", + "release_date": "2025-04-17", + "last_updated": "2025-04-17", "cost": { - "input": 0.25, - "output": 1.25, - "cache_read": 0.03, - "cache_write": 0.3 - }, - "type": "chat" + "input": 0.15, + "output": 0.6, + "cache_read": 0.0375 + } }, { - "id": "anthropic--claude-3-sonnet", - "name": "anthropic--claude-3-sonnet", - "display_name": "anthropic--claude-3-sonnet", + "id": "gemini-2.5-pro-preview-tts", + "name": "Gemini 2.5 Pro Preview TTS", + "display_name": "Gemini 2.5 Pro Preview TTS", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ - "text" + "audio" ] }, "limit": { - "context": 200000, - "output": 4096 + "context": 8000, + "output": 16000 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2023-08-31", - "release_date": "2024-03-04", - "last_updated": "2024-03-04", + "knowledge": "2025-01", + "release_date": "2025-05-01", + "last_updated": "2025-05-01", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 0.3 - }, - "type": "chat" + "input": 1, + "output": 20 + } }, { - "id": "gpt-5-nano", - "name": "gpt-5-nano", - "display_name": "gpt-5-nano", + "id": "gemini-2.5-pro", + "name": "Gemini 2.5 Pro", + "display_name": "Gemini 2.5 Pro", "modalities": { "input": [ "text", @@ -49733,265 +47825,271 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 1048576, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": true, + "budget": { + "default": -1, + "min": 128, + "max": 32768 + } + }, + "search": { + "supported": true, + "default": false }, "attachment": true, "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-06-05", "cost": { - "input": 0.05, - "output": 0.4, - "cache_read": 0.01 - }, - "type": "chat" + "input": 1.25, + "output": 10, + "cache_read": 0.31 + } }, { - "id": "anthropic--claude-3.7-sonnet", - "name": "anthropic--claude-3.7-sonnet", - "display_name": "anthropic--claude-3.7-sonnet", + "id": "gemini-1.5-flash", + "name": "Gemini 1.5 Flash", + "display_name": "Gemini 1.5 Flash", "modalities": { "input": [ "text", "image", - "pdf" + "audio", + "video" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 1000000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2024-10-31", - "release_date": "2025-02-24", - "last_updated": "2025-02-24", + "knowledge": "2024-04", + "release_date": "2024-05-14", + "last_updated": "2024-05-14", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 - }, - "type": "chat" + "input": 0.075, + "output": 0.3, + "cache_read": 0.01875 + } }, { - "id": "gpt-5-mini", - "name": "gpt-5-mini", - "display_name": "gpt-5-mini", + "id": "gemini-1.5-flash-8b", + "name": "Gemini 1.5 Flash-8B", + "display_name": "Gemini 1.5 Flash-8B", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 1000000, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "knowledge": "2024-04", + "release_date": "2024-10-03", + "last_updated": "2024-10-03", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.03 - }, - "type": "chat" + "input": 0.0375, + "output": 0.15, + "cache_read": 0.01 + } }, { - "id": "anthropic--claude-4.5-sonnet", - "name": "anthropic--claude-4.5-sonnet", - "display_name": "anthropic--claude-4.5-sonnet", + "id": "gemini-2.5-flash-lite-preview-09-2025", + "name": "Gemini 2.5 Flash Lite Preview 09 2025", + "display_name": "Gemini 2.5 Flash Lite Preview 09 2025", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false, + "budget": { + "default": -1, + "min": 512, + "max": 24576 + } + }, + "search": { + "supported": true, + "default": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-01-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "knowledge": "2025-01", + "release_date": "2025-09-25", + "last_updated": "2025-09-25", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 - }, - "type": "chat" + "input": 0.1, + "output": 0.4, + "cache_read": 0.025 + } }, { - "id": "gemini-2.5-pro", - "name": "gemini-2.5-pro", - "display_name": "gemini-2.5-pro", + "id": "gemini-1.5-pro", + "name": "Gemini 1.5 Pro", + "display_name": "Gemini 1.5 Pro", "modalities": { "input": [ "text", "image", "audio", - "video", - "pdf" + "video" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 1000000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-03-25", - "last_updated": "2025-06-05", + "knowledge": "2024-04", + "release_date": "2024-02-15", + "last_updated": "2024-02-15", "cost": { "input": 1.25, - "output": 10, - "cache_read": 0.31 - }, - "type": "chat" + "output": 5, + "cache_read": 0.3125 + } }, { - "id": "anthropic--claude-3-opus", - "name": "anthropic--claude-3-opus", - "display_name": "anthropic--claude-3-opus", + "id": "gemini-2.0-flash-preview-image-generation", + "name": "Gemini 2.0 Flash Preview Image Generation", + "display_name": "Gemini 2.0 Flash Preview Image Generation", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ - "text" + "text", + "image" ] }, "limit": { - "context": 200000, - "output": 4096 + "context": 32000, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2023-08-31", - "release_date": "2024-02-29", - "last_updated": "2024-02-29", - "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "search": { + "supported": false }, - "type": "chat" - }, + "attachment": true + } + ] + }, + "google-vertex": { + "id": "google-vertex", + "name": "Vertex", + "display_name": "Vertex", + "doc": "https://cloud.google.com/vertex-ai/generative-ai/docs/models", + "models": [ { - "id": "anthropic--claude-4-sonnet", - "name": "anthropic--claude-4-sonnet", - "display_name": "anthropic--claude-4-sonnet", + "id": "gemini-embedding-001", + "name": "Gemini Embedding 001", + "display_name": "Gemini Embedding 001", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 2048, + "output": 3072 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "knowledge": "2025-05", + "release_date": "2025-05-20", + "last_updated": "2025-05-20", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 - }, - "type": "chat" + "input": 0.15, + "output": 0 + } }, { - "id": "gpt-5", - "name": "gpt-5", - "display_name": "gpt-5", + "id": "gemini-3-flash-preview", + "name": "Gemini 3 Flash Preview", + "display_name": "Gemini 3 Flash Preview", "modalities": { "input": [ "text", - "image" + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 1048576, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -49999,32 +48097,30 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "knowledge": "2025-01", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.13 - }, - "type": "chat" - } - ] - }, - "anthropic": { - "id": "anthropic", - "name": "Anthropic", - "display_name": "Anthropic", - "doc": "https://docs.anthropic.com/en/docs/about-claude/models", - "models": [ + "input": 0.5, + "output": 3, + "cache_read": 0.05, + "context_over_200k": { + "input": 0.5, + "output": 3, + "cache_read": 0.05 + } + } + }, { - "id": "claude-opus-4-0", - "name": "Claude Opus 4 (latest)", - "display_name": "Claude Opus 4 (latest)", + "id": "gemini-2.5-flash-preview-05-20", + "name": "Gemini 2.5 Flash Preview 05-20", + "display_name": "Gemini 2.5 Flash Preview 05-20", "modalities": { "input": [ "text", "image", + "audio", + "video", "pdf" ], "output": [ @@ -50032,8 +48128,8 @@ ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -50043,25 +48139,25 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "knowledge": "2025-01", + "release_date": "2025-05-20", + "last_updated": "2025-05-20", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 - }, - "type": "chat" + "input": 0.15, + "output": 0.6, + "cache_read": 0.0375 + } }, { - "id": "claude-3-5-sonnet-20241022", - "name": "Claude Sonnet 3.5 v2", - "display_name": "Claude Sonnet 3.5 v2", + "id": "gemini-flash-lite-latest", + "name": "Gemini Flash-Lite Latest", + "display_name": "Gemini Flash-Lite Latest", "modalities": { "input": [ "text", "image", + "audio", + "video", "pdf" ], "output": [ @@ -50069,35 +48165,36 @@ ] }, "limit": { - "context": 200000, - "output": 8192 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2024-04-30", - "release_date": "2024-10-22", - "last_updated": "2024-10-22", + "knowledge": "2025-01", + "release_date": "2025-09-25", + "last_updated": "2025-09-25", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 - }, - "type": "chat" + "input": 0.1, + "output": 0.4, + "cache_read": 0.025 + } }, { - "id": "claude-opus-4-1", - "name": "Claude Opus 4.1 (latest)", - "display_name": "Claude Opus 4.1 (latest)", + "id": "gemini-3-pro-preview", + "name": "Gemini 3 Pro Preview", + "display_name": "Gemini 3 Pro Preview", "modalities": { "input": [ "text", "image", + "video", + "audio", "pdf" ], "output": [ @@ -50105,8 +48202,8 @@ ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -50116,25 +48213,30 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "knowledge": "2025-01", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 - }, - "type": "chat" + "input": 2, + "output": 12, + "cache_read": 0.2, + "context_over_200k": { + "input": 4, + "output": 18, + "cache_read": 0.4 + } + } }, { - "id": "claude-haiku-4-5", - "name": "Claude Haiku 4.5 (latest)", - "display_name": "Claude Haiku 4.5 (latest)", + "id": "gemini-2.5-flash", + "name": "Gemini 2.5 Flash", + "display_name": "Gemini 2.5 Flash", "modalities": { "input": [ "text", "image", + "audio", + "video", "pdf" ], "output": [ @@ -50142,8 +48244,8 @@ ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -50153,25 +48255,26 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-02-28", - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "knowledge": "2025-01", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", "cost": { - "input": 1, - "output": 5, - "cache_read": 0.1, - "cache_write": 1.25 - }, - "type": "chat" + "input": 0.3, + "output": 2.5, + "cache_read": 0.075, + "cache_write": 0.383 + } }, { - "id": "claude-3-5-sonnet-20240620", - "name": "Claude Sonnet 3.5", - "display_name": "Claude Sonnet 3.5", + "id": "gemini-flash-latest", + "name": "Gemini Flash Latest", + "display_name": "Gemini Flash Latest", "modalities": { "input": [ "text", "image", + "audio", + "video", "pdf" ], "output": [ @@ -50179,35 +48282,37 @@ ] }, "limit": { - "context": 200000, - "output": 8192 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2024-04-30", - "release_date": "2024-06-20", - "last_updated": "2024-06-20", + "knowledge": "2025-01", + "release_date": "2025-09-25", + "last_updated": "2025-09-25", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 - }, - "type": "chat" + "input": 0.3, + "output": 2.5, + "cache_read": 0.075, + "cache_write": 0.383 + } }, { - "id": "claude-3-5-haiku-latest", - "name": "Claude Haiku 3.5 (latest)", - "display_name": "Claude Haiku 3.5 (latest)", + "id": "gemini-2.5-pro-preview-05-06", + "name": "Gemini 2.5 Pro Preview 05-06", + "display_name": "Gemini 2.5 Pro Preview 05-06", "modalities": { "input": [ "text", "image", + "audio", + "video", "pdf" ], "output": [ @@ -50215,35 +48320,36 @@ ] }, "limit": { - "context": 200000, - "output": 8192 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2024-07-31", - "release_date": "2024-10-22", - "last_updated": "2024-10-22", + "knowledge": "2025-01", + "release_date": "2025-05-06", + "last_updated": "2025-05-06", "cost": { - "input": 0.8, - "output": 4, - "cache_read": 0.08, - "cache_write": 1 - }, - "type": "chat" + "input": 1.25, + "output": 10, + "cache_read": 0.31 + } }, { - "id": "claude-opus-4-5", - "name": "Claude Opus 4.5 (latest)", - "display_name": "Claude Opus 4.5 (latest)", + "id": "gemini-2.0-flash-lite", + "name": "Gemini 2.0 Flash Lite", + "display_name": "Gemini 2.0 Flash Lite", "modalities": { "input": [ "text", "image", + "audio", + "video", "pdf" ], "output": [ @@ -50251,36 +48357,34 @@ ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 1048576, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-11-24", - "last_updated": "2025-11-24", + "knowledge": "2024-06", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 - }, - "type": "chat" + "input": 0.075, + "output": 0.3 + } }, { - "id": "claude-3-opus-20240229", - "name": "Claude Opus 3", - "display_name": "Claude Opus 3", + "id": "gemini-2.0-flash", + "name": "Gemini 2.0 Flash", + "display_name": "Gemini 2.0 Flash", "modalities": { "input": [ "text", "image", + "audio", + "video", "pdf" ], "output": [ @@ -50288,8 +48392,8 @@ ] }, "limit": { - "context": 200000, - "output": 4096 + "context": 1048576, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -50298,25 +48402,25 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2023-08-31", - "release_date": "2024-02-29", - "last_updated": "2024-02-29", + "knowledge": "2024-06", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 - }, - "type": "chat" + "input": 0.15, + "output": 0.6, + "cache_read": 0.025 + } }, { - "id": "claude-opus-4-5-20251101", - "name": "Claude Opus 4.5", - "display_name": "Claude Opus 4.5", + "id": "gemini-2.5-flash-lite", + "name": "Gemini 2.5 Flash Lite", + "display_name": "Gemini 2.5 Flash Lite", "modalities": { "input": [ "text", "image", + "audio", + "video", "pdf" ], "output": [ @@ -50324,8 +48428,8 @@ ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -50335,25 +48439,25 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-11-01", - "last_updated": "2025-11-01", + "knowledge": "2025-01", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 - }, - "type": "chat" + "input": 0.1, + "output": 0.4, + "cache_read": 0.025 + } }, { - "id": "claude-sonnet-4-5", - "name": "Claude Sonnet 4.5 (latest)", - "display_name": "Claude Sonnet 4.5 (latest)", + "id": "gemini-2.5-pro-preview-06-05", + "name": "Gemini 2.5 Pro Preview 06-05", + "display_name": "Gemini 2.5 Pro Preview 06-05", "modalities": { "input": [ "text", "image", + "audio", + "video", "pdf" ], "output": [ @@ -50361,8 +48465,8 @@ ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -50372,25 +48476,25 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "knowledge": "2025-01", + "release_date": "2025-06-05", + "last_updated": "2025-06-05", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 - }, - "type": "chat" + "input": 1.25, + "output": 10, + "cache_read": 0.31 + } }, { - "id": "claude-sonnet-4-5-20250929", - "name": "Claude Sonnet 4.5", - "display_name": "Claude Sonnet 4.5", + "id": "gemini-2.5-flash-lite-preview-06-17", + "name": "Gemini 2.5 Flash Lite Preview 06-17", + "display_name": "Gemini 2.5 Flash Lite Preview 06-17", "modalities": { "input": [ "text", "image", + "audio", + "video", "pdf" ], "output": [ @@ -50398,8 +48502,8 @@ ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 65536, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -50409,25 +48513,25 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "knowledge": "2025-01", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 - }, - "type": "chat" + "input": 0.1, + "output": 0.4, + "cache_read": 0.025 + } }, { - "id": "claude-sonnet-4-20250514", - "name": "Claude Sonnet 4", - "display_name": "Claude Sonnet 4", + "id": "gemini-2.5-flash-preview-09-2025", + "name": "Gemini 2.5 Flash Preview 09-25", + "display_name": "Gemini 2.5 Flash Preview 09-25", "modalities": { "input": [ "text", "image", + "audio", + "video", "pdf" ], "output": [ @@ -50435,8 +48539,8 @@ ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -50446,25 +48550,26 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "knowledge": "2025-01", + "release_date": "2025-09-25", + "last_updated": "2025-09-25", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 - }, - "type": "chat" + "input": 0.3, + "output": 2.5, + "cache_read": 0.075, + "cache_write": 0.383 + } }, { - "id": "claude-opus-4-20250514", - "name": "Claude Opus 4", - "display_name": "Claude Opus 4", + "id": "gemini-2.5-flash-preview-04-17", + "name": "Gemini 2.5 Flash Preview 04-17", + "display_name": "Gemini 2.5 Flash Preview 04-17", "modalities": { "input": [ "text", "image", + "audio", + "video", "pdf" ], "output": [ @@ -50472,8 +48577,8 @@ ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -50483,25 +48588,25 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "knowledge": "2025-01", + "release_date": "2025-04-17", + "last_updated": "2025-04-17", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 - }, - "type": "chat" + "input": 0.15, + "output": 0.6, + "cache_read": 0.0375 + } }, { - "id": "claude-3-5-haiku-20241022", - "name": "Claude Haiku 3.5", - "display_name": "Claude Haiku 3.5", + "id": "gemini-2.5-pro", + "name": "Gemini 2.5 Pro", + "display_name": "Gemini 2.5 Pro", "modalities": { "input": [ "text", "image", + "audio", + "video", "pdf" ], "output": [ @@ -50509,71 +48614,36 @@ ] }, "limit": { - "context": 200000, - "output": 8192 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2024-07-31", - "release_date": "2024-10-22", - "last_updated": "2024-10-22", - "cost": { - "input": 0.8, - "output": 4, - "cache_read": 0.08, - "cache_write": 1 - }, - "type": "chat" - }, - { - "id": "claude-3-haiku-20240307", - "name": "Claude Haiku 3", - "display_name": "Claude Haiku 3", - "modalities": { - "input": [ - "text", - "image", - "pdf" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 200000, - "output": 4096 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": false, - "knowledge": "2023-08-31", - "release_date": "2024-03-13", - "last_updated": "2024-03-13", + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-06-05", "cost": { - "input": 0.25, - "output": 1.25, - "cache_read": 0.03, - "cache_write": 0.3 - }, - "type": "chat" + "input": 1.25, + "output": 10, + "cache_read": 0.31 + } }, { - "id": "claude-3-7-sonnet-20250219", - "name": "Claude Sonnet 3.7", - "display_name": "Claude Sonnet 3.7", + "id": "gemini-2.5-flash-lite-preview-09-2025", + "name": "Gemini 2.5 Flash Lite Preview 09-25", + "display_name": "Gemini 2.5 Flash Lite Preview 09-25", "modalities": { "input": [ "text", "image", + "audio", + "video", "pdf" ], "output": [ @@ -50581,8 +48651,8 @@ ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -50592,34 +48662,30 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-10-31", - "release_date": "2025-02-19", - "last_updated": "2025-02-19", + "knowledge": "2025-01", + "release_date": "2025-09-25", + "last_updated": "2025-09-25", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 - }, - "type": "chat" + "input": 0.1, + "output": 0.4, + "cache_read": 0.025 + } }, { - "id": "claude-3-7-sonnet-latest", - "name": "Claude Sonnet 3.7 (latest)", - "display_name": "Claude Sonnet 3.7 (latest)", + "id": "openai/gpt-oss-120b-maas", + "name": "GPT OSS 120B", + "display_name": "GPT OSS 120B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -50627,36 +48693,30 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-10-31", - "release_date": "2025-02-19", - "last_updated": "2025-02-19", + "attachment": false, + "open_weights": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 - }, - "type": "chat" + "input": 0.09, + "output": 0.36 + } }, { - "id": "claude-sonnet-4-0", - "name": "Claude Sonnet 4 (latest)", - "display_name": "Claude Sonnet 4 (latest)", + "id": "openai/gpt-oss-20b-maas", + "name": "GPT OSS 20B", + "display_name": "GPT OSS 20B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -50664,36 +48724,30 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "attachment": false, + "open_weights": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 - }, - "type": "chat" + "input": 0.07, + "output": 0.25 + } }, { - "id": "claude-opus-4-1-20250805", - "name": "Claude Opus 4.1", - "display_name": "Claude Opus 4.1", + "id": "zai-org/glm-4.7-maas", + "name": "GLM-4.7", + "display_name": "GLM-4.7", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -50701,105 +48755,104 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 - }, - "type": "chat" - }, + "input": 0.6, + "output": 2.2 + } + } + ] + }, + "inception": { + "id": "inception", + "name": "Inception", + "display_name": "Inception", + "api": "https://api.inceptionlabs.ai/v1/", + "doc": "https://platform.inceptionlabs.ai/docs", + "models": [ { - "id": "claude-3-sonnet-20240229", - "name": "Claude Sonnet 3", - "display_name": "Claude Sonnet 3", + "id": "mercury-coder", + "name": "Mercury Coder", + "display_name": "Mercury Coder", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 4096 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2023-08-31", - "release_date": "2024-03-04", - "last_updated": "2024-03-04", + "knowledge": "2023-10", + "release_date": "2025-02-26", + "last_updated": "2025-07-31", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 0.3 - }, - "type": "chat" + "input": 0.25, + "output": 1, + "cache_read": 0.25, + "cache_write": 1 + } }, { - "id": "claude-haiku-4-5-20251001", - "name": "Claude Haiku 4.5", - "display_name": "Claude Haiku 4.5", + "id": "mercury", + "name": "Mercury", + "display_name": "Mercury", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-02-28", - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "knowledge": "2023-10", + "release_date": "2025-06-26", + "last_updated": "2025-07-31", "cost": { - "input": 1, - "output": 5, - "cache_read": 0.1, - "cache_write": 1.25 - }, - "type": "chat" + "input": 0.25, + "output": 1, + "cache_read": 0.25, + "cache_write": 1 + } } ] }, - "fireworks-ai": { - "id": "fireworks-ai", - "name": "Fireworks AI", - "display_name": "Fireworks AI", - "api": "https://api.fireworks.ai/inference/v1/", - "doc": "https://fireworks.ai/docs/", + "wandb": { + "id": "wandb", + "name": "Weights & Biases", + "display_name": "Weights & Biases", + "api": "https://api.inference.wandb.ai/v1", + "doc": "https://weave-docs.wandb.ai/guides/integrations/inference/", "models": [ { - "id": "accounts/fireworks/models/deepseek-r1-0528", - "name": "Deepseek R1 05/28", - "display_name": "Deepseek R1 05/28", + "id": "moonshotai/Kimi-K2-Instruct", + "name": "Kimi-K2-Instruct", + "display_name": "Kimi-K2-Instruct", "modalities": { "input": [ "text" @@ -50809,30 +48862,28 @@ ] }, "limit": { - "context": 160000, + "context": 128000, "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-05", - "release_date": "2025-05-28", - "last_updated": "2025-05-28", + "knowledge": "2024-10", + "release_date": "2025-07-14", + "last_updated": "2025-07-14", "cost": { - "input": 3, - "output": 8 - }, - "type": "chat" + "input": 1.35, + "output": 4 + } }, { - "id": "accounts/fireworks/models/deepseek-v3p1", - "name": "DeepSeek V3.1", - "display_name": "DeepSeek V3.1", + "id": "microsoft/Phi-4-mini-instruct", + "name": "Phi-4-mini-instruct", + "display_name": "Phi-4-mini-instruct", "modalities": { "input": [ "text" @@ -50842,8 +48893,8 @@ ] }, "limit": { - "context": 163840, - "output": 163840 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -50853,19 +48904,18 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-07", - "release_date": "2025-08-21", - "last_updated": "2025-08-21", + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 0.56, - "output": 1.68 - }, - "type": "chat" + "input": 0.08, + "output": 0.35 + } }, { - "id": "accounts/fireworks/models/deepseek-v3p2", - "name": "DeepSeek V3.2", - "display_name": "DeepSeek V3.2", + "id": "meta-llama/Llama-3.1-8B-Instruct", + "name": "Meta-Llama-3.1-8B-Instruct", + "display_name": "Meta-Llama-3.1-8B-Instruct", "modalities": { "input": [ "text" @@ -50875,8 +48925,8 @@ ] }, "limit": { - "context": 160000, - "output": 160000 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -50886,20 +48936,18 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-09", - "release_date": "2025-12-01", - "last_updated": "2025-12-01", + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 0.56, - "output": 1.68, - "cache_read": 0.28 - }, - "type": "chat" + "input": 0.22, + "output": 0.22 + } }, { - "id": "accounts/fireworks/models/minimax-m2", - "name": "MiniMax-M2", - "display_name": "MiniMax-M2", + "id": "meta-llama/Llama-3.3-70B-Instruct", + "name": "Llama-3.3-70B-Instruct", + "display_name": "Llama-3.3-70B-Instruct", "modalities": { "input": [ "text" @@ -50909,8 +48957,8 @@ ] }, "limit": { - "context": 192000, - "output": 192000 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -50920,31 +48968,30 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-11", - "release_date": "2025-10-27", - "last_updated": "2025-10-27", + "knowledge": "2023-12", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.15 - }, - "type": "chat" + "input": 0.71, + "output": 0.71 + } }, { - "id": "accounts/fireworks/models/minimax-m2p1", - "name": "MiniMax-M2.1", - "display_name": "MiniMax-M2.1", + "id": "meta-llama/Llama-4-Scout-17B-16E-Instruct", + "name": "Llama 4 Scout 17B 16E Instruct", + "display_name": "Llama 4 Scout 17B 16E Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 200000 + "context": 64000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -50954,19 +49001,18 @@ }, "attachment": false, "open_weights": true, - "release_date": "2025-12-23", - "last_updated": "2025-12-23", + "knowledge": "2024-12", + "release_date": "2025-01-31", + "last_updated": "2025-01-31", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.15 - }, - "type": "chat" + "input": 0.17, + "output": 0.66 + } }, { - "id": "accounts/fireworks/models/glm-4p7", - "name": "GLM 4.7", - "display_name": "GLM 4.7", + "id": "Qwen/Qwen3-235B-A22B-Instruct-2507", + "name": "Qwen3 235B A22B Instruct 2507", + "display_name": "Qwen3 235B A22B Instruct 2507", "modalities": { "input": [ "text" @@ -50976,31 +49022,28 @@ ] }, "limit": { - "context": 198000, - "output": 198000 + "context": 262144, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, "knowledge": "2025-04", - "release_date": "2025-12-22", - "last_updated": "2025-12-22", + "release_date": "2025-04-28", + "last_updated": "2025-07-21", "cost": { - "input": 0.6, - "output": 2.2, - "cache_read": 0.3 - }, - "type": "chat" + "input": 0.1, + "output": 0.1 + } }, { - "id": "accounts/fireworks/models/deepseek-v3-0324", - "name": "Deepseek V3 03-24", - "display_name": "Deepseek V3 03-24", + "id": "Qwen/Qwen3-Coder-480B-A35B-Instruct", + "name": "Qwen3-Coder-480B-A35B-Instruct", + "display_name": "Qwen3-Coder-480B-A35B-Instruct", "modalities": { "input": [ "text" @@ -51010,8 +49053,8 @@ ] }, "limit": { - "context": 160000, - "output": 16384 + "context": 262144, + "output": 66536 }, "temperature": true, "tool_call": true, @@ -51020,19 +49063,18 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-03-24", - "last_updated": "2025-03-24", + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", "cost": { - "input": 0.9, - "output": 0.9 - }, - "type": "chat" + "input": 1, + "output": 1.5 + } }, { - "id": "accounts/fireworks/models/glm-4p6", - "name": "GLM 4.6", - "display_name": "GLM 4.6", + "id": "Qwen/Qwen3-235B-A22B-Thinking-2507", + "name": "Qwen3-235B-A22B-Thinking-2507", + "display_name": "Qwen3-235B-A22B-Thinking-2507", "modalities": { "input": [ "text" @@ -51042,8 +49084,8 @@ ] }, "limit": { - "context": 198000, - "output": 198000 + "context": 262144, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -51054,19 +49096,17 @@ "attachment": false, "open_weights": true, "knowledge": "2025-04", - "release_date": "2025-10-01", - "last_updated": "2025-10-01", + "release_date": "2025-07-25", + "last_updated": "2025-07-25", "cost": { - "input": 0.55, - "output": 2.19, - "cache_read": 0.28 - }, - "type": "chat" + "input": 0.1, + "output": 0.1 + } }, { - "id": "accounts/fireworks/models/kimi-k2-thinking", - "name": "Kimi K2 Thinking", - "display_name": "Kimi K2 Thinking", + "id": "deepseek-ai/DeepSeek-R1-0528", + "name": "DeepSeek-R1-0528", + "display_name": "DeepSeek-R1-0528", "modalities": { "input": [ "text" @@ -51076,8 +49116,8 @@ ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 161000, + "output": 163840 }, "temperature": true, "tool_call": true, @@ -51087,18 +49127,18 @@ }, "attachment": false, "open_weights": true, - "release_date": "2025-11-06", - "last_updated": "2025-11-06", + "knowledge": "2025-05", + "release_date": "2025-05-28", + "last_updated": "2025-05-28", "cost": { - "input": 0.6, - "output": 2.5 - }, - "type": "chat" + "input": 1.35, + "output": 5.4 + } }, { - "id": "accounts/fireworks/models/kimi-k2-instruct", - "name": "Kimi K2 Instruct", - "display_name": "Kimi K2 Instruct", + "id": "deepseek-ai/DeepSeek-V3-0324", + "name": "DeepSeek-V3-0324", + "display_name": "DeepSeek-V3-0324", "modalities": { "input": [ "text" @@ -51108,8 +49148,8 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 161000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -51119,18 +49159,26 @@ "attachment": false, "open_weights": true, "knowledge": "2024-10", - "release_date": "2025-07-11", - "last_updated": "2025-07-11", + "release_date": "2025-03-24", + "last_updated": "2025-03-24", "cost": { - "input": 1, - "output": 3 - }, - "type": "chat" - }, + "input": 1.14, + "output": 2.75 + } + } + ] + }, + "cloudflare-ai-gateway": { + "id": "cloudflare-ai-gateway", + "name": "Cloudflare AI Gateway", + "display_name": "Cloudflare AI Gateway", + "api": "https://gateway.ai.cloudflare.com/v1/${CLOUDFLARE_ACCOUNT_ID}/${CLOUDFLARE_GATEWAY_ID}/compat/", + "doc": "https://developers.cloudflare.com/ai-gateway/", + "models": [ { - "id": "accounts/fireworks/models/qwen3-235b-a22b", - "name": "Qwen3 235B-A22B", - "display_name": "Qwen3 235B-A22B", + "id": "openai/gpt-4", + "name": "GPT-4", + "display_name": "GPT-4", "modalities": { "input": [ "text" @@ -51140,62 +49188,62 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 8192, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04-29", - "last_updated": "2025-04-29", + "attachment": true, + "open_weights": false, + "knowledge": "2023-11", + "release_date": "2023-11-06", + "last_updated": "2024-04-09", "cost": { - "input": 0.22, - "output": 0.88 - }, - "type": "chat" + "input": 30, + "output": 60 + } }, { - "id": "accounts/fireworks/models/gpt-oss-20b", - "name": "GPT OSS 20B", - "display_name": "GPT OSS 20B", + "id": "openai/gpt-5.1-codex", + "name": "GPT-5.1 Codex", + "display_name": "GPT-5.1 Codex", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.05, - "output": 0.2 - }, - "type": "chat" + "input": 1.25, + "output": 10, + "cache_read": 0.125 + } }, { - "id": "accounts/fireworks/models/gpt-oss-120b", - "name": "GPT OSS 120B", - "display_name": "GPT OSS 120B", + "id": "openai/gpt-3.5-turbo", + "name": "GPT-3.5-turbo", + "display_name": "GPT-3.5-turbo", "modalities": { "input": [ "text" @@ -51205,62 +49253,61 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 16385, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "open_weights": false, + "knowledge": "2021-09-01", + "release_date": "2023-03-01", + "last_updated": "2023-11-06", "cost": { - "input": 0.15, - "output": 0.6 - }, - "type": "chat" + "input": 0.5, + "output": 1.5, + "cache_read": 1.25 + } }, { - "id": "accounts/fireworks/models/glm-4p5-air", - "name": "GLM 4.5 Air", - "display_name": "GLM 4.5 Air", + "id": "openai/gpt-4-turbo", + "name": "GPT-4 Turbo", + "display_name": "GPT-4 Turbo", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-08-01", - "last_updated": "2025-08-01", + "attachment": true, + "open_weights": false, + "knowledge": "2023-12", + "release_date": "2023-11-06", + "last_updated": "2024-04-09", "cost": { - "input": 0.22, - "output": 0.88 - }, - "type": "chat" + "input": 10, + "output": 30 + } }, { - "id": "accounts/fireworks/models/qwen3-coder-480b-a35b-instruct", - "name": "Qwen3 Coder 480B A35B Instruct", - "display_name": "Qwen3 Coder 480B A35B Instruct", + "id": "openai/o3-mini", + "name": "o3-mini", + "display_name": "o3-mini", "modalities": { "input": [ "text" @@ -51270,244 +49317,236 @@ ] }, "limit": { - "context": 256000, - "output": 32768 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": true, - "release_date": "2025-07-22", - "last_updated": "2025-07-22", + "open_weights": false, + "knowledge": "2024-05", + "release_date": "2024-12-20", + "last_updated": "2025-01-29", "cost": { - "input": 0.45, - "output": 1.8 - }, - "type": "chat" + "input": 1.1, + "output": 4.4, + "cache_read": 0.55 + } }, { - "id": "accounts/fireworks/models/glm-4p5", - "name": "GLM 4.5", - "display_name": "GLM 4.5", + "id": "openai/gpt-5.1", + "name": "GPT-5.1", + "display_name": "GPT-5.1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-29", - "last_updated": "2025-07-29", + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.55, - "output": 2.19 - }, - "type": "chat" - } - ] - }, - "io-net": { - "id": "io-net", - "name": "IO.NET", - "display_name": "IO.NET", - "api": "https://api.intelligence.io.solutions/api/v1", - "doc": "https://io.net/docs/guides/intelligence/io-intelligence", - "models": [ + "input": 1.25, + "output": 10, + "cache_read": 0.13 + } + }, { - "id": "moonshotai/Kimi-K2-Instruct-0905", - "name": "Kimi K2 Instruct", - "display_name": "Kimi K2 Instruct", + "id": "openai/gpt-4o", + "name": "GPT-4o", + "display_name": "GPT-4o", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 4096 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-08", - "release_date": "2024-09-05", - "last_updated": "2024-09-05", + "knowledge": "2023-09", + "release_date": "2024-05-13", + "last_updated": "2024-08-06", "cost": { - "input": 0.39, - "output": 1.9, - "cache_read": 0.195, - "cache_write": 0.78 - }, - "type": "chat" + "input": 2.5, + "output": 10, + "cache_read": 1.25 + } }, { - "id": "moonshotai/Kimi-K2-Thinking", - "name": "Kimi K2 Thinking", - "display_name": "Kimi K2 Thinking", + "id": "openai/o4-mini", + "name": "o4-mini", + "display_name": "o4-mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 4096 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-08", - "release_date": "2024-11-01", - "last_updated": "2024-11-01", + "knowledge": "2024-05", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "cost": { - "input": 0.55, - "output": 2.25, - "cache_read": 0.275, - "cache_write": 1.1 - }, - "type": "chat" + "input": 1.1, + "output": 4.4, + "cache_read": 0.28 + } }, { - "id": "openai/gpt-oss-20b", - "name": "GPT-OSS 20B", - "display_name": "GPT-OSS 20B", + "id": "openai/o1", + "name": "o1", + "display_name": "o1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 64000, - "output": 4096 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "attachment": true, + "open_weights": false, + "knowledge": "2023-09", + "release_date": "2024-12-05", + "last_updated": "2024-12-05", "cost": { - "input": 0.03, - "output": 0.14, - "cache_read": 0.015, - "cache_write": 0.06 - }, - "type": "chat" + "input": 15, + "output": 60, + "cache_read": 7.5 + } }, { - "id": "openai/gpt-oss-120b", - "name": "GPT-OSS 120B", - "display_name": "GPT-OSS 120B", + "id": "openai/o3-pro", + "name": "o3-pro", + "display_name": "o3-pro", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 4096 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "attachment": true, + "open_weights": false, + "knowledge": "2024-05", + "release_date": "2025-06-10", + "last_updated": "2025-06-10", "cost": { - "input": 0.04, - "output": 0.4, - "cache_read": 0.02, - "cache_write": 0.08 - }, - "type": "chat" + "input": 20, + "output": 80 + } }, { - "id": "mistralai/Devstral-Small-2505", - "name": "Devstral Small 2505", - "display_name": "Devstral Small 2505", + "id": "openai/o3", + "name": "o3", + "display_name": "o3", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-12", - "release_date": "2025-05-01", - "last_updated": "2025-05-01", + "knowledge": "2024-05", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "cost": { - "input": 0.05, - "output": 0.22, - "cache_read": 0.025, - "cache_write": 0.1 - }, - "type": "chat" + "input": 2, + "output": 8, + "cache_read": 0.5 + } }, { - "id": "mistralai/Mistral-Nemo-Instruct-2407", - "name": "Mistral Nemo Instruct 2407", - "display_name": "Mistral Nemo Instruct 2407", + "id": "openai/gpt-4o-mini", + "name": "GPT-4o mini", + "display_name": "GPT-4o mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -51515,213 +49554,224 @@ }, "limit": { "context": 128000, - "output": 4096 + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-05", - "release_date": "2024-07-01", - "last_updated": "2024-07-01", + "attachment": true, + "open_weights": false, + "knowledge": "2023-09", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", "cost": { - "input": 0.02, - "output": 0.04, - "cache_read": 0.01, - "cache_write": 0.04 - }, - "type": "chat" + "input": 0.15, + "output": 0.6, + "cache_read": 0.08 + } }, { - "id": "mistralai/Magistral-Small-2506", - "name": "Magistral Small 2506", - "display_name": "Magistral Small 2506", + "id": "openai/gpt-5.2", + "name": "GPT-5.2", + "display_name": "GPT-5.2", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-06-01", - "last_updated": "2025-06-01", + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 0.5, - "output": 1.5, - "cache_read": 0.25, - "cache_write": 1 - }, - "type": "chat" + "input": 1.75, + "output": 14, + "cache_read": 0.175 + } }, { - "id": "mistralai/Mistral-Large-Instruct-2411", - "name": "Mistral Large Instruct 2411", - "display_name": "Mistral Large Instruct 2411", + "id": "anthropic/claude-opus-4", + "name": "Claude Opus 4 (latest)", + "display_name": "Claude Opus 4 (latest)", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 200000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-11-01", - "last_updated": "2024-11-01", + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 2, - "output": 6, - "cache_read": 1, - "cache_write": 4 - }, - "type": "chat" + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 + } }, { - "id": "meta-llama/Llama-3.3-70B-Instruct", - "name": "Llama 3.3 70B Instruct", - "display_name": "Llama 3.3 70B Instruct", + "id": "anthropic/claude-opus-4-1", + "name": "Claude Opus 4.1 (latest)", + "display_name": "Claude Opus 4.1 (latest)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 200000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.13, - "output": 0.38, - "cache_read": 0.065, - "cache_write": 0.26 - }, - "type": "chat" - }, - { - "id": "meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8", - "name": "Llama 4 Maverick 17B 128E Instruct", - "display_name": "Llama 4 Maverick 17B 128E Instruct", + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 + } + }, + { + "id": "anthropic/claude-haiku-4-5", + "name": "Claude Haiku 4.5 (latest)", + "display_name": "Claude Haiku 4.5 (latest)", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 430000, - "output": 4096 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-01-15", - "last_updated": "2025-01-15", + "attachment": true, + "open_weights": false, + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "cost": { - "input": 0.15, - "output": 0.6, - "cache_read": 0.075, - "cache_write": 0.3 - }, - "type": "chat" + "input": 1, + "output": 5, + "cache_read": 0.1, + "cache_write": 1.25 + } }, { - "id": "meta-llama/Llama-3.2-90B-Vision-Instruct", - "name": "Llama 3.2 90B Vision Instruct", - "display_name": "Llama 3.2 90B Vision Instruct", + "id": "anthropic/claude-opus-4-6", + "name": "Claude Opus 4.6 (latest)", + "display_name": "Claude Opus 4.6 (latest)", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 16000, - "output": 4096 + "context": 1000000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-09-25", - "last_updated": "2024-09-25", + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", "cost": { - "input": 0.35, - "output": 0.4, - "cache_read": 0.175, - "cache_write": 0.7 - }, - "type": "chat" + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25, + "context_over_200k": { + "input": 10, + "output": 37.5, + "cache_read": 1, + "cache_write": 12.5 + } + } }, { - "id": "Intel/Qwen3-Coder-480B-A35B-Instruct-int4-mixed-ar", - "name": "Qwen 3 Coder 480B", - "display_name": "Qwen 3 Coder 480B", + "id": "anthropic/claude-3-haiku", + "name": "Claude Haiku 3", + "display_name": "Claude Haiku 3", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 106000, + "context": 200000, "output": 4096 }, "temperature": true, @@ -51729,130 +49779,134 @@ "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-01-15", - "last_updated": "2025-01-15", + "attachment": true, + "open_weights": false, + "knowledge": "2023-08-31", + "release_date": "2024-03-13", + "last_updated": "2024-03-13", "cost": { - "input": 0.22, - "output": 0.95, - "cache_read": 0.11, - "cache_write": 0.44 - }, - "type": "chat" + "input": 0.25, + "output": 1.25, + "cache_read": 0.03, + "cache_write": 0.3 + } }, { - "id": "Qwen/Qwen2.5-VL-32B-Instruct", - "name": "Qwen 2.5 VL 32B Instruct", - "display_name": "Qwen 2.5 VL 32B Instruct", + "id": "anthropic/claude-opus-4-5", + "name": "Claude Opus 4.5 (latest)", + "display_name": "Claude Opus 4.5 (latest)", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 32000, - "output": 4096 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-09", - "release_date": "2024-11-01", - "last_updated": "2024-11-01", + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-11-24", + "last_updated": "2025-11-24", "cost": { - "input": 0.05, - "output": 0.22, - "cache_read": 0.025, - "cache_write": 0.1 - }, - "type": "chat" + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 + } }, { - "id": "Qwen/Qwen3-235B-A22B-Thinking-2507", - "name": "Qwen 3 235B Thinking", - "display_name": "Qwen 3 235B Thinking", + "id": "anthropic/claude-3-opus", + "name": "Claude Opus 3", + "display_name": "Claude Opus 3", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, + "context": 200000, "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-07-01", - "last_updated": "2025-07-01", + "attachment": true, + "open_weights": false, + "knowledge": "2023-08-31", + "release_date": "2024-02-29", + "last_updated": "2024-02-29", "cost": { - "input": 0.11, - "output": 0.6, - "cache_read": 0.055, - "cache_write": 0.22 - }, - "type": "chat" + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 + } }, { - "id": "Qwen/Qwen3-Next-80B-A3B-Instruct", - "name": "Qwen 3 Next 80B Instruct", - "display_name": "Qwen 3 Next 80B Instruct", + "id": "anthropic/claude-sonnet-4-5", + "name": "Claude Sonnet 4.5 (latest)", + "display_name": "Claude Sonnet 4.5 (latest)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 4096 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-01-10", - "last_updated": "2025-01-10", + "attachment": true, + "open_weights": false, + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 0.1, - "output": 0.8, - "cache_read": 0.05, - "cache_write": 0.2 - }, - "type": "chat" + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 + } }, { - "id": "zai-org/GLM-4.6", - "name": "GLM 4.6", - "display_name": "GLM 4.6", + "id": "anthropic/claude-3.5-sonnet", + "name": "Claude Sonnet 3.5 v2", + "display_name": "Claude Sonnet 3.5 v2", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" @@ -51860,151 +49914,147 @@ }, "limit": { "context": 200000, - "output": 4096 + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-11-15", - "last_updated": "2024-11-15", + "knowledge": "2024-04-30", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", "cost": { - "input": 0.4, - "output": 1.75, - "cache_read": 0.2, - "cache_write": 0.8 - }, - "type": "chat" + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 + } }, { - "id": "deepseek-ai/DeepSeek-R1-0528", - "name": "DeepSeek R1", - "display_name": "DeepSeek R1", + "id": "anthropic/claude-3-sonnet", + "name": "Claude Sonnet 3", + "display_name": "Claude Sonnet 3", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 200000, "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-01-20", - "last_updated": "2025-05-28", + "attachment": true, + "open_weights": false, + "knowledge": "2023-08-31", + "release_date": "2024-03-04", + "last_updated": "2024-03-04", "cost": { - "input": 2, - "output": 8.75, - "cache_read": 1, - "cache_write": 4 - }, - "type": "chat" - } - ] - }, - "modelscope": { - "id": "modelscope", - "name": "ModelScope", - "display_name": "ModelScope", - "api": "https://api-inference.modelscope.cn/v1", - "doc": "https://modelscope.cn/docs/model-service/API-Inference/intro", - "models": [ + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 0.3 + } + }, { - "id": "ZhipuAI/GLM-4.5", - "name": "GLM-4.5", - "display_name": "GLM-4.5", + "id": "anthropic/claude-3-5-haiku", + "name": "Claude Haiku 3.5 (latest)", + "display_name": "Claude Haiku 3.5 (latest)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 98304 + "context": 200000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "attachment": true, + "open_weights": false, + "knowledge": "2024-07-31", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.8, + "output": 4, + "cache_read": 0.08, + "cache_write": 1 + } }, { - "id": "ZhipuAI/GLM-4.6", - "name": "GLM-4.6", - "display_name": "GLM-4.6", + "id": "anthropic/claude-3.5-haiku", + "name": "Claude Haiku 3.5 (latest)", + "display_name": "Claude Haiku 3.5 (latest)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 202752, - "output": 98304 + "context": 200000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-07", - "release_date": "2025-09-30", - "last_updated": "2025-09-30", + "attachment": true, + "open_weights": false, + "knowledge": "2024-07-31", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.8, + "output": 4, + "cache_read": 0.08, + "cache_write": 1 + } }, { - "id": "Qwen/Qwen3-30B-A3B-Thinking-2507", - "name": "Qwen3 30B A3B Thinking 2507", - "display_name": "Qwen3 30B A3B Thinking 2507", + "id": "anthropic/claude-sonnet-4", + "name": "Claude Sonnet 4 (latest)", + "display_name": "Claude Sonnet 4 (latest)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -52012,53 +50062,63 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-30", - "last_updated": "2025-07-30", + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" - }, + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 + } + } + ] + }, + "openai": { + "id": "openai", + "name": "OpenAI", + "display_name": "OpenAI", + "doc": "https://platform.openai.com/docs/models", + "models": [ { - "id": "Qwen/Qwen3-235B-A22B-Instruct-2507", - "name": "Qwen3 235B A22B Instruct 2507", - "display_name": "Qwen3 235B A22B Instruct 2507", + "id": "gpt-4.1-nano", + "name": "GPT-4.1 nano", + "display_name": "GPT-4.1 nano", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 131072 + "context": 1047576, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04-28", - "last_updated": "2025-07-21", + "attachment": true, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.1, + "output": 0.4, + "cache_read": 0.03 + } }, { - "id": "Qwen/Qwen3-Coder-30B-A3B-Instruct", - "name": "Qwen3 Coder 30B A3B Instruct", - "display_name": "Qwen3 Coder 30B A3B Instruct", + "id": "text-embedding-3-small", + "name": "text-embedding-3-small", + "display_name": "text-embedding-3-small", "modalities": { "input": [ "text" @@ -52068,29 +50128,28 @@ ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 8191, + "output": 1536 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-31", - "last_updated": "2025-07-31", + "open_weights": false, + "knowledge": "2024-01", + "release_date": "2024-01-25", + "last_updated": "2024-01-25", "cost": { - "input": 0, + "input": 0.02, "output": 0 - }, - "type": "chat" + } }, { - "id": "Qwen/Qwen3-30B-A3B-Instruct-2507", - "name": "Qwen3 30B A3B Instruct 2507", - "display_name": "Qwen3 30B A3B Instruct 2507", + "id": "gpt-4", + "name": "GPT-4", + "display_name": "GPT-4", "modalities": { "input": [ "text" @@ -52100,170 +50159,166 @@ ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 8192, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-30", - "last_updated": "2025-07-30", + "attachment": true, + "open_weights": false, + "knowledge": "2023-11", + "release_date": "2023-11-06", + "last_updated": "2024-04-09", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 30, + "output": 60 + } }, { - "id": "Qwen/Qwen3-235B-A22B-Thinking-2507", - "name": "Qwen3-235B-A22B-Thinking-2507", - "display_name": "Qwen3-235B-A22B-Thinking-2507", + "id": "o1-pro", + "name": "o1-pro", + "display_name": "o1-pro", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 131072 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-25", - "last_updated": "2025-07-25", + "attachment": true, + "open_weights": false, + "knowledge": "2023-09", + "release_date": "2025-03-19", + "last_updated": "2025-03-19", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" - } - ] - }, - "azure-cognitive-services": { - "id": "azure-cognitive-services", - "name": "Azure Cognitive Services", - "display_name": "Azure Cognitive Services", - "doc": "https://learn.microsoft.com/en-us/azure/ai-services/openai/concepts/models", - "models": [ + "input": 150, + "output": 600 + } + }, { - "id": "gpt-3.5-turbo-1106", - "name": "GPT-3.5 Turbo 1106", - "display_name": "GPT-3.5 Turbo 1106", + "id": "gpt-4o-2024-05-13", + "name": "GPT-4o (2024-05-13)", + "display_name": "GPT-4o (2024-05-13)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 128000, + "output": 4096 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2021-08", - "release_date": "2023-11-06", - "last_updated": "2023-11-06", + "knowledge": "2023-09", + "release_date": "2024-05-13", + "last_updated": "2024-05-13", "cost": { - "input": 1, - "output": 2 - }, - "type": "chat" + "input": 5, + "output": 15 + } }, { - "id": "mistral-small-2503", - "name": "Mistral Small 3.1", - "display_name": "Mistral Small 3.1", + "id": "gpt-5.2-codex", + "name": "GPT-5.2 Codex", + "display_name": "GPT-5.2 Codex", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2024-09", - "release_date": "2025-03-01", - "last_updated": "2025-03-01", + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 0.1, - "output": 0.3 - }, - "type": "chat" + "input": 1.75, + "output": 14, + "cache_read": 0.175 + } }, { - "id": "codestral-2501", - "name": "Codestral 25.01", - "display_name": "Codestral 25.01", + "id": "gpt-5.1-codex", + "name": "GPT-5.1 Codex", + "display_name": "GPT-5.1 Codex", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-03", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.3, - "output": 0.9 - }, - "type": "chat" + "input": 1.25, + "output": 10, + "cache_read": 0.125 + } }, { - "id": "mistral-large-2411", - "name": "Mistral Large 24.11", - "display_name": "Mistral Large 24.11", + "id": "gpt-4o-2024-08-06", + "name": "GPT-4o (2024-08-06)", + "display_name": "GPT-4o (2024-08-06)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -52271,28 +50326,28 @@ }, "limit": { "context": 128000, - "output": 32768 + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-09", - "release_date": "2024-11-01", - "last_updated": "2024-11-01", + "knowledge": "2023-09", + "release_date": "2024-08-06", + "last_updated": "2024-08-06", "cost": { - "input": 2, - "output": 6 - }, - "type": "chat" + "input": 2.5, + "output": 10, + "cache_read": 1.25 + } }, { - "id": "gpt-5-pro", - "name": "GPT-5 Pro", - "display_name": "GPT-5 Pro", + "id": "gpt-4.1-mini", + "name": "GPT-4.1 mini", + "display_name": "GPT-4.1 mini", "modalities": { "input": [ "text", @@ -52303,64 +50358,63 @@ ] }, "limit": { - "context": 400000, - "output": 272000 + "context": 1047576, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-10-06", - "last_updated": "2025-10-06", + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 15, - "output": 120 - }, - "type": "chat" + "input": 0.4, + "output": 1.6, + "cache_read": 0.1 + } }, { - "id": "deepseek-v3.2", - "name": "DeepSeek-V3.2", - "display_name": "DeepSeek-V3.2", + "id": "o3-deep-research", + "name": "o3-deep-research", + "display_name": "o3-deep-research", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-12-01", - "last_updated": "2025-12-01", + "attachment": true, + "open_weights": false, + "knowledge": "2024-05", + "release_date": "2024-06-26", + "last_updated": "2024-06-26", "cost": { - "input": 0.28, - "output": 0.42, - "cache_read": 0.028 - }, - "type": "chat" + "input": 10, + "output": 40, + "cache_read": 2.5 + } }, { - "id": "mai-ds-r1", - "name": "MAI-DS-R1", - "display_name": "MAI-DS-R1", + "id": "gpt-3.5-turbo", + "name": "GPT-3.5-turbo", + "display_name": "GPT-3.5-turbo", "modalities": { "input": [ "text" @@ -52370,30 +50424,29 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 16385, + "output": 4096 }, "temperature": true, "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2024-06", - "release_date": "2025-01-20", - "last_updated": "2025-01-20", + "knowledge": "2021-09-01", + "release_date": "2023-03-01", + "last_updated": "2023-11-06", "cost": { - "input": 1.35, - "output": 5.4 - }, - "type": "chat" + "input": 0.5, + "output": 1.5, + "cache_read": 1.25 + } }, { - "id": "gpt-5", - "name": "GPT-5", - "display_name": "GPT-5", + "id": "gpt-5.2-pro", + "name": "GPT-5.2 Pro", + "display_name": "GPT-5.2 Pro", "modalities": { "input": [ "text", @@ -52404,7 +50457,7 @@ ] }, "limit": { - "context": 272000, + "context": 400000, "output": 128000 }, "temperature": false, @@ -52415,20 +50468,49 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.13 + "input": 21, + "output": 168 + } + }, + { + "id": "text-embedding-3-large", + "name": "text-embedding-3-large", + "display_name": "text-embedding-3-large", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] }, - "type": "chat" + "limit": { + "context": 8191, + "output": 3072 + }, + "temperature": false, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "knowledge": "2024-01", + "release_date": "2024-01-25", + "last_updated": "2024-01-25", + "cost": { + "input": 0.13, + "output": 0 + } }, { - "id": "gpt-4o-mini", - "name": "GPT-4o mini", - "display_name": "GPT-4o mini", + "id": "gpt-4-turbo", + "name": "GPT-4 Turbo", + "display_name": "GPT-4 Turbo", "modalities": { "input": [ "text", @@ -52440,7 +50522,7 @@ }, "limit": { "context": 128000, - "output": 16384 + "output": 4096 }, "temperature": true, "tool_call": true, @@ -52449,20 +50531,18 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-07-18", - "last_updated": "2024-07-18", + "knowledge": "2023-12", + "release_date": "2023-11-06", + "last_updated": "2024-04-09", "cost": { - "input": 0.15, - "output": 0.6, - "cache_read": 0.08 - }, - "type": "chat" + "input": 10, + "output": 30 + } }, { - "id": "phi-4-reasoning-plus", - "name": "Phi-4-reasoning-plus", - "display_name": "Phi-4-reasoning-plus", + "id": "o1-preview", + "name": "o1-preview", + "display_name": "o1-preview", "modalities": { "input": [ "text" @@ -52472,8 +50552,8 @@ ] }, "limit": { - "context": 32000, - "output": 4096 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": false, @@ -52482,20 +50562,20 @@ "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "open_weights": false, + "knowledge": "2023-09", + "release_date": "2024-09-12", + "last_updated": "2024-09-12", "cost": { - "input": 0.125, - "output": 0.5 - }, - "type": "chat" + "input": 15, + "output": 60, + "cache_read": 7.5 + } }, { - "id": "gpt-4-turbo-vision", - "name": "GPT-4 Turbo Vision", - "display_name": "GPT-4 Turbo Vision", + "id": "gpt-5.1-codex-mini", + "name": "GPT-5.1 Codex mini", + "display_name": "GPT-5.1 Codex mini", "modalities": { "input": [ "text", @@ -52506,29 +50586,30 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2023-11", - "release_date": "2023-11-06", - "last_updated": "2024-04-09", + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 10, - "output": 30 - }, - "type": "chat" + "input": 0.25, + "output": 2, + "cache_read": 0.025 + } }, { - "id": "phi-4-reasoning", - "name": "Phi-4-reasoning", - "display_name": "Phi-4-reasoning", + "id": "o3-mini", + "name": "o3-mini", + "display_name": "o3-mini", "modalities": { "input": [ "text" @@ -52538,60 +50619,96 @@ ] }, "limit": { - "context": 32000, - "output": 4096 + "context": 200000, + "output": 100000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "open_weights": false, + "knowledge": "2024-05", + "release_date": "2024-12-20", + "last_updated": "2025-01-29", "cost": { - "input": 0.125, - "output": 0.5 - }, - "type": "chat" + "input": 1.1, + "output": 4.4, + "cache_read": 0.55 + } }, { - "id": "phi-3-medium-4k-instruct", - "name": "Phi-3-medium-instruct (4k)", - "display_name": "Phi-3-medium-instruct (4k)", + "id": "gpt-5.2-chat-latest", + "name": "GPT-5.2 Chat", + "display_name": "GPT-5.2 Chat", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 4096, - "output": 1024 + "context": 128000, + "output": 16384 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-04-23", - "last_updated": "2024-04-23", + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 0.17, - "output": 0.68 + "input": 1.75, + "output": 14, + "cache_read": 0.175 + } + }, + { + "id": "gpt-5.1", + "name": "GPT-5.1", + "display_name": "GPT-5.1", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] }, - "type": "chat" + "limit": { + "context": 400000, + "output": 128000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", + "cost": { + "input": 1.25, + "output": 10, + "cache_read": 0.13 + } }, { - "id": "codex-mini", + "id": "codex-mini-latest", "name": "Codex Mini", "display_name": "Codex Mini", "modalities": { @@ -52621,13 +50738,12 @@ "input": 1.5, "output": 6, "cache_read": 0.375 - }, - "type": "chat" + } }, { - "id": "o3", - "name": "o3", - "display_name": "o3", + "id": "gpt-5-nano", + "name": "GPT-5 Nano", + "display_name": "GPT-5 Nano", "modalities": { "input": [ "text", @@ -52638,8 +50754,8 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 400000, + "output": 128000 }, "temperature": false, "tool_call": true, @@ -52649,94 +50765,97 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-05", - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 2, - "output": 8, - "cache_read": 0.5 - }, - "type": "chat" + "input": 0.05, + "output": 0.4, + "cache_read": 0.005 + } }, { - "id": "mistral-nemo", - "name": "Mistral Nemo", - "display_name": "Mistral Nemo", + "id": "gpt-5-codex", + "name": "GPT-5-Codex", + "display_name": "GPT-5-Codex", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 400000, "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2024-07", - "release_date": "2024-07-18", - "last_updated": "2024-07-18", + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-09-15", + "last_updated": "2025-09-15", "cost": { - "input": 0.15, - "output": 0.15 - }, - "type": "chat" + "input": 1.25, + "output": 10, + "cache_read": 0.125 + } }, { - "id": "gpt-3.5-turbo-instruct", - "name": "GPT-3.5 Turbo Instruct", - "display_name": "GPT-3.5 Turbo Instruct", + "id": "gpt-4o", + "name": "GPT-4o", + "display_name": "GPT-4o", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 4096, - "output": 4096 + "context": 128000, + "output": 16384 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2021-08", - "release_date": "2023-09-21", - "last_updated": "2023-09-21", + "knowledge": "2023-09", + "release_date": "2024-05-13", + "last_updated": "2024-08-06", "cost": { - "input": 1.5, - "output": 2 - }, - "type": "chat" + "input": 2.5, + "output": 10, + "cache_read": 1.25 + } }, { - "id": "meta-llama-3.1-8b-instruct", - "name": "Meta-Llama-3.1-8B-Instruct", - "display_name": "Meta-Llama-3.1-8B-Instruct", + "id": "gpt-4.1", + "name": "GPT-4.1", + "display_name": "GPT-4.1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 1047576, "output": 32768 }, "temperature": true, @@ -52744,82 +50863,55 @@ "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", - "cost": { - "input": 0.3, - "output": 0.61 - }, - "type": "chat" - }, - { - "id": "text-embedding-ada-002", - "name": "text-embedding-ada-002", - "display_name": "text-embedding-ada-002", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 8192, - "output": 1536 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2022-12-15", - "last_updated": "2022-12-15", + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.1, - "output": 0 - }, - "type": "embedding" + "input": 2, + "output": 8, + "cache_read": 0.5 + } }, { - "id": "cohere-embed-v3-english", - "name": "Embed v3 English", - "display_name": "Embed v3 English", + "id": "o4-mini", + "name": "o4-mini", + "display_name": "o4-mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 512, - "output": 1024 + "context": 200000, + "output": 100000 }, "temperature": false, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2023-11-07", - "last_updated": "2023-11-07", + "attachment": true, + "open_weights": false, + "knowledge": "2024-05", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "cost": { - "input": 0.1, - "output": 0 - }, - "type": "chat" + "input": 1.1, + "output": 4.4, + "cache_read": 0.28 + } }, { - "id": "llama-4-scout-17b-16e-instruct", - "name": "Llama 4 Scout 17B 16E Instruct", - "display_name": "Llama 4 Scout 17B 16E Instruct", + "id": "o1", + "name": "o1", + "display_name": "o1", "modalities": { "input": [ "text", @@ -52830,40 +50922,43 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, - "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "open_weights": false, + "knowledge": "2023-09", + "release_date": "2024-12-05", + "last_updated": "2024-12-05", "cost": { - "input": 0.2, - "output": 0.78 - }, - "type": "chat" + "input": 15, + "output": 60, + "cache_read": 7.5 + } }, { - "id": "o1-mini", - "name": "o1-mini", - "display_name": "o1-mini", + "id": "gpt-5.3-codex", + "name": "GPT-5.3 Codex", + "display_name": "GPT-5.3 Codex", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 65536 + "context": 400000, + "output": 128000 }, "temperature": false, "tool_call": true, @@ -52871,17 +50966,16 @@ "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-09-12", - "last_updated": "2024-09-12", + "knowledge": "2025-08-31", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.55 - }, - "type": "chat" + "input": 1.75, + "output": 14, + "cache_read": 0.175 + } }, { "id": "gpt-5-mini", @@ -52897,7 +50991,7 @@ ] }, "limit": { - "context": 272000, + "context": 400000, "output": 128000 }, "temperature": false, @@ -52914,14 +51008,13 @@ "cost": { "input": 0.25, "output": 2, - "cache_read": 0.03 - }, - "type": "chat" + "cache_read": 0.025 + } }, { - "id": "phi-3.5-moe-instruct", - "name": "Phi-3.5-MoE-instruct", - "display_name": "Phi-3.5-MoE-instruct", + "id": "o1-mini", + "name": "o1-mini", + "display_name": "o1-mini", "modalities": { "input": [ "text" @@ -52932,66 +51025,29 @@ }, "limit": { "context": 128000, - "output": 4096 - }, - "temperature": true, - "tool_call": false, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-08-20", - "last_updated": "2024-08-20", - "cost": { - "input": 0.16, - "output": 0.64 - }, - "type": "chat" - }, - { - "id": "gpt-5.1-chat", - "name": "GPT-5.1 Chat", - "display_name": "GPT-5.1 Chat", - "modalities": { - "input": [ - "text", - "image", - "audio" - ], - "output": [ - "text", - "image", - "audio" - ] - }, - "limit": { - "context": 128000, - "output": 16384 + "output": 65536 }, "temperature": false, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-14", - "last_updated": "2025-11-14", + "knowledge": "2023-09", + "release_date": "2024-09-12", + "last_updated": "2024-09-12", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 - }, - "type": "chat" + "input": 1.1, + "output": 4.4, + "cache_read": 0.55 + } }, { - "id": "grok-3-mini", - "name": "Grok 3 Mini", - "display_name": "Grok 3 Mini", + "id": "text-embedding-ada-002", + "name": "text-embedding-ada-002", + "display_name": "text-embedding-ada-002", "modalities": { "input": [ "text" @@ -53001,32 +51057,28 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 8192, + "output": 1536 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2024-11", - "release_date": "2025-02-17", - "last_updated": "2025-02-17", + "knowledge": "2022-12", + "release_date": "2022-12-15", + "last_updated": "2022-12-15", "cost": { - "input": 0.3, - "output": 0.5, - "reasoning": 0.5, - "cache_read": 0.075 - }, - "type": "chat" + "input": 0.1, + "output": 0 + } }, { - "id": "o1", - "name": "o1", - "display_name": "o1", + "id": "o3-pro", + "name": "o3-pro", + "display_name": "o3-pro", "modalities": { "input": [ "text", @@ -53046,89 +51098,87 @@ "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-12-05", - "last_updated": "2024-12-05", + "knowledge": "2024-05", + "release_date": "2025-06-10", + "last_updated": "2025-06-10", "cost": { - "input": 15, - "output": 60, - "cache_read": 7.5 - }, - "type": "chat" + "input": 20, + "output": 80 + } }, { - "id": "meta-llama-3-8b-instruct", - "name": "Meta-Llama-3-8B-Instruct", - "display_name": "Meta-Llama-3-8B-Instruct", + "id": "gpt-4o-2024-11-20", + "name": "GPT-4o (2024-11-20)", + "display_name": "GPT-4o (2024-11-20)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 2048 + "context": 128000, + "output": 16384 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-04-18", - "last_updated": "2024-04-18", + "attachment": true, + "open_weights": false, + "knowledge": "2023-09", + "release_date": "2024-11-20", + "last_updated": "2024-11-20", "cost": { - "input": 0.3, - "output": 0.61 - }, - "type": "chat" + "input": 2.5, + "output": 10, + "cache_read": 1.25 + } }, { - "id": "phi-4-multimodal", - "name": "Phi-4-multimodal", - "display_name": "Phi-4-multimodal", + "id": "gpt-5.1-codex-max", + "name": "GPT-5.1 Codex Max", + "display_name": "GPT-5.1 Codex Max", "modalities": { "input": [ "text", - "image", - "audio" + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 400000, + "output": 128000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.08, - "output": 0.32, - "input_audio": 4 - }, - "type": "chat" + "input": 1.25, + "output": 10, + "cache_read": 0.125 + } }, { - "id": "o4-mini", - "name": "o4-mini", - "display_name": "o4-mini", + "id": "o3", + "name": "o3", + "display_name": "o3", "modalities": { "input": [ "text", @@ -53154,16 +51204,15 @@ "release_date": "2025-04-16", "last_updated": "2025-04-16", "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.28 - }, - "type": "chat" + "input": 2, + "output": 8, + "cache_read": 0.5 + } }, { - "id": "gpt-4.1", - "name": "GPT-4.1", - "display_name": "GPT-4.1", + "id": "o4-mini-deep-research", + "name": "o4-mini-deep-research", + "display_name": "o4-mini-deep-research", "modalities": { "input": [ "text", @@ -53174,94 +51223,96 @@ ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, "knowledge": "2024-05", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "release_date": "2024-06-26", + "last_updated": "2024-06-26", "cost": { "input": 2, "output": 8, "cache_read": 0.5 - }, - "type": "chat" + } }, { - "id": "ministral-3b", - "name": "Ministral 3B", - "display_name": "Ministral 3B", + "id": "gpt-5-chat-latest", + "name": "GPT-5 Chat (latest)", + "display_name": "GPT-5 Chat (latest)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 400000, + "output": 128000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-03", - "release_date": "2024-10-22", - "last_updated": "2024-10-22", + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.04, - "output": 0.04 - }, - "type": "chat" + "input": 1.25, + "output": 10 + } }, { - "id": "gpt-3.5-turbo-0301", - "name": "GPT-3.5 Turbo 0301", - "display_name": "GPT-3.5 Turbo 0301", + "id": "gpt-4o-mini", + "name": "GPT-4o mini", + "display_name": "GPT-4o mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 4096, - "output": 4096 + "context": 128000, + "output": 16384 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2021-08", - "release_date": "2023-03-01", - "last_updated": "2023-03-01", + "knowledge": "2023-09", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", "cost": { - "input": 1.5, - "output": 2 - }, - "type": "chat" + "input": 0.15, + "output": 0.6, + "cache_read": 0.08 + } }, { - "id": "gpt-4o", - "name": "GPT-4o", - "display_name": "GPT-4o", + "id": "gpt-5", + "name": "GPT-5", + "display_name": "GPT-5", "modalities": { "input": [ "text", @@ -53272,62 +51323,63 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-05-13", - "last_updated": "2024-05-13", - "cost": { - "input": 2.5, + "knowledge": "2024-09-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", + "cost": { + "input": 1.25, "output": 10, - "cache_read": 1.25 - }, - "type": "chat" + "cache_read": 0.125 + } }, { - "id": "phi-3-mini-128k-instruct", - "name": "Phi-3-mini-instruct (128k)", - "display_name": "Phi-3-mini-instruct (128k)", + "id": "gpt-5-pro", + "name": "GPT-5 Pro", + "display_name": "GPT-5 Pro", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 400000, + "output": 272000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-04-23", - "last_updated": "2024-04-23", + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-10-06", + "last_updated": "2025-10-06", "cost": { - "input": 0.13, - "output": 0.52 - }, - "type": "chat" + "input": 15, + "output": 120 + } }, { - "id": "llama-3.2-90b-vision-instruct", - "name": "Llama-3.2-90B-Vision-Instruct", - "display_name": "Llama-3.2-90B-Vision-Instruct", + "id": "gpt-5.2", + "name": "GPT-5.2", + "display_name": "GPT-5.2", "modalities": { "input": [ "text", @@ -53338,29 +51390,30 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-09-25", - "last_updated": "2024-09-25", + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 2.04, - "output": 2.04 - }, - "type": "chat" + "input": 1.75, + "output": 14, + "cache_read": 0.175 + } }, { - "id": "gpt-5-codex", - "name": "GPT-5-Codex", - "display_name": "GPT-5-Codex", + "id": "gpt-5.1-chat-latest", + "name": "GPT-5.1 Chat", + "display_name": "GPT-5.1 Chat", "modalities": { "input": [ "text", @@ -53371,8 +51424,8 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 128000, + "output": 16384 }, "temperature": false, "tool_call": true, @@ -53380,95 +51433,98 @@ "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, "knowledge": "2024-09-30", - "release_date": "2025-09-15", - "last_updated": "2025-09-15", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { "input": 1.25, "output": 10, - "cache_read": 0.13 - }, - "type": "chat" - }, + "cache_read": 0.125 + } + } + ] + }, + "zhipuai-coding-plan": { + "id": "zhipuai-coding-plan", + "name": "Zhipu AI Coding Plan", + "display_name": "Zhipu AI Coding Plan", + "api": "https://open.bigmodel.cn/api/coding/paas/v4", + "doc": "https://docs.bigmodel.cn/cn/coding-plan/overview", + "models": [ { - "id": "gpt-5-nano", - "name": "GPT-5 Nano", - "display_name": "GPT-5 Nano", + "id": "glm-4.6v-flash", + "name": "GLM-4.6V-Flash", + "display_name": "GLM-4.6V-Flash", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 272000, - "output": 128000 + "context": 128000, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, "attachment": true, - "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-12-08", + "last_updated": "2025-12-08", "cost": { - "input": 0.05, - "output": 0.4, - "cache_read": 0.01 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "gpt-5.1", - "name": "GPT-5.1", - "display_name": "GPT-5.1", + "id": "glm-4.6v", + "name": "GLM-4.6V", + "display_name": "GLM-4.6V", "modalities": { "input": [ "text", "image", - "audio" + "video" ], "output": [ - "text", - "image", - "audio" + "text" ] }, "limit": { - "context": 272000, - "output": 128000 + "context": 128000, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-14", - "last_updated": "2025-11-14", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-12-08", + "last_updated": "2025-12-08", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "o3-mini", - "name": "o3-mini", - "display_name": "o3-mini", + "id": "glm-4.6", + "name": "GLM-4.6", + "display_name": "GLM-4.6", "modalities": { "input": [ "text" @@ -53478,62 +51534,65 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 204800, + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2024-05", - "release_date": "2024-12-20", - "last_updated": "2025-01-29", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.55 - }, - "type": "chat" + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 + } }, { - "id": "model-router", - "name": "Model Router", - "display_name": "Model Router", + "id": "glm-4.5v", + "name": "GLM-4.5V", + "display_name": "GLM-4.5V", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 64000, "output": 16384 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, - "open_weights": false, - "release_date": "2025-05-19", - "last_updated": "2025-11-18", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-08-11", + "last_updated": "2025-08-11", "cost": { - "input": 0.14, + "input": 0, "output": 0 - }, - "type": "chat" + } }, { - "id": "kimi-k2-thinking", - "name": "Kimi K2 Thinking", - "display_name": "Kimi K2 Thinking", + "id": "glm-4.5-air", + "name": "GLM-4.5-Air", + "display_name": "GLM-4.5-Air", "modalities": { "input": [ "text" @@ -53543,8 +51602,8 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 131072, + "output": 98304 }, "temperature": true, "tool_call": true, @@ -53554,55 +51613,54 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-11-06", - "last_updated": "2025-12-02", + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 0.6, - "output": 2.5, - "cache_read": 0.15 - }, - "type": "chat" + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 + } }, { - "id": "gpt-5.1-codex-mini", - "name": "GPT-5.1 Codex Mini", - "display_name": "GPT-5.1 Codex Mini", + "id": "glm-4.5", + "name": "GLM-4.5", + "display_name": "GLM-4.5", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 131072, + "output": 98304 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-14", - "last_updated": "2025-11-14", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.025 - }, - "type": "chat" + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 + } }, { - "id": "llama-3.3-70b-instruct", - "name": "Llama-3.3-70B-Instruct", - "display_name": "Llama-3.3-70B-Instruct", + "id": "glm-4.5-flash", + "name": "GLM-4.5-Flash", + "display_name": "GLM-4.5-Flash", "modalities": { "input": [ "text" @@ -53612,29 +51670,31 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 131072, + "output": 98304 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 0.71, - "output": 0.71 - }, - "type": "chat" + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 + } }, { - "id": "o1-preview", - "name": "o1-preview", - "display_name": "o1-preview", + "id": "glm-4.7", + "name": "GLM-4.7", + "display_name": "GLM-4.7", "modalities": { "input": [ "text" @@ -53644,31 +51704,40 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 204800, + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-09-12", - "last_updated": "2024-09-12", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "cost": { - "input": 16.5, - "output": 66, - "cache_read": 8.25 - }, - "type": "chat" - }, + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 + } + } + ] + }, + "minimax-cn": { + "id": "minimax-cn", + "name": "MiniMax (minimaxi.com)", + "display_name": "MiniMax (minimaxi.com)", + "api": "https://api.minimaxi.com/anthropic/v1", + "doc": "https://platform.minimaxi.com/docs/guides/quickstart", + "models": [ { - "id": "phi-3.5-mini-instruct", - "name": "Phi-3.5-mini-instruct", - "display_name": "Phi-3.5-mini-instruct", + "id": "MiniMax-M2.1", + "name": "MiniMax-M2.1", + "display_name": "MiniMax-M2.1", "modalities": { "input": [ "text" @@ -53678,29 +51747,28 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 204800, + "output": 131072 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-08-20", - "last_updated": "2024-08-20", + "release_date": "2025-12-23", + "last_updated": "2025-12-23", "cost": { - "input": 0.13, - "output": 0.52 - }, - "type": "chat" + "input": 0.3, + "output": 1.2 + } }, { - "id": "gpt-3.5-turbo-0613", - "name": "GPT-3.5 Turbo 0613", - "display_name": "GPT-3.5 Turbo 0613", + "id": "MiniMax-M2", + "name": "MiniMax-M2", + "display_name": "MiniMax-M2", "modalities": { "input": [ "text" @@ -53710,33 +51778,39 @@ ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 196608, + "output": 128000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2021-08", - "release_date": "2023-06-13", - "last_updated": "2023-06-13", + "open_weights": true, + "release_date": "2025-10-27", + "last_updated": "2025-10-27", "cost": { - "input": 3, - "output": 4 - }, - "type": "chat" - }, + "input": 0.3, + "output": 1.2 + } + } + ] + }, + "perplexity": { + "id": "perplexity", + "name": "Perplexity", + "display_name": "Perplexity", + "doc": "https://docs.perplexity.ai", + "models": [ { - "id": "gpt-4-turbo", - "name": "GPT-4 Turbo", - "display_name": "GPT-4 Turbo", + "id": "sonar", + "name": "Sonar", + "display_name": "Sonar", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -53747,89 +51821,98 @@ "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2023-11", - "release_date": "2023-11-06", - "last_updated": "2024-04-09", + "knowledge": "2025-09-01", + "release_date": "2024-01-01", + "last_updated": "2025-09-01", "cost": { - "input": 10, - "output": 30 - }, - "type": "chat" + "input": 1, + "output": 1 + } }, { - "id": "meta-llama-3.1-70b-instruct", - "name": "Meta-Llama-3.1-70B-Instruct", - "display_name": "Meta-Llama-3.1-70B-Instruct", + "id": "sonar-pro", + "name": "Sonar Pro", + "display_name": "Sonar Pro", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 200000, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "attachment": true, + "open_weights": false, + "knowledge": "2025-09-01", + "release_date": "2024-01-01", + "last_updated": "2025-09-01", "cost": { - "input": 2.68, - "output": 3.54 - }, - "type": "chat" + "input": 3, + "output": 15 + } }, { - "id": "phi-3-small-8k-instruct", - "name": "Phi-3-small-instruct (8k)", - "display_name": "Phi-3-small-instruct (8k)", + "id": "sonar-reasoning-pro", + "name": "Sonar Reasoning Pro", + "display_name": "Sonar Reasoning Pro", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 2048 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-04-23", - "last_updated": "2024-04-23", + "attachment": true, + "open_weights": false, + "knowledge": "2025-09-01", + "release_date": "2024-01-01", + "last_updated": "2025-09-01", "cost": { - "input": 0.15, - "output": 0.6 - }, - "type": "chat" - }, + "input": 2, + "output": 8 + } + } + ] + }, + "zenmux": { + "id": "zenmux", + "name": "zenmux", + "display_name": "zenmux", + "api": "https://zenmux.ai/api/anthropic/v1", + "doc": "https://docs.zenmux.ai", + "models": [ { - "id": "deepseek-v3-0324", - "name": "DeepSeek-V3-0324", - "display_name": "DeepSeek-V3-0324", + "id": "stepfun/step-3.5-flash-free", + "name": "Step 3.5 Flash (Free)", + "display_name": "Step 3.5 Flash (Free)", "modalities": { "input": [ "text" @@ -53839,31 +51922,32 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 256000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-03-24", - "last_updated": "2025-03-24", + "open_weights": false, + "knowledge": "2025-01-01", + "release_date": "2026-02-02", + "last_updated": "2026-02-02", "cost": { - "input": 1.14, - "output": 4.56 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "meta-llama-3-70b-instruct", - "name": "Meta-Llama-3-70B-Instruct", - "display_name": "Meta-Llama-3-70B-Instruct", + "id": "stepfun/step-3", + "name": "Step-3", + "display_name": "Step-3", "modalities": { "input": [ + "image", "text" ], "output": [ @@ -53871,29 +51955,29 @@ ] }, "limit": { - "context": 8192, - "output": 2048 + "context": 65536, + "output": 64000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-04-18", - "last_updated": "2024-04-18", + "attachment": true, + "open_weights": false, + "knowledge": "2025-01-01", + "release_date": "2025-07-31", + "last_updated": "2025-07-31", "cost": { - "input": 2.68, - "output": 3.54 - }, - "type": "chat" + "input": 0.21, + "output": 0.57 + } }, { - "id": "text-embedding-3-large", - "name": "text-embedding-3-large", - "display_name": "text-embedding-3-large", + "id": "stepfun/step-3.5-flash", + "name": "Step 3.5 Flash", + "display_name": "Step 3.5 Flash", "modalities": { "input": [ "text" @@ -53903,27 +51987,29 @@ ] }, "limit": { - "context": 8191, - "output": 3072 + "context": 256000, + "output": 64000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "release_date": "2024-01-25", - "last_updated": "2024-01-25", + "knowledge": "2025-01-01", + "release_date": "2026-02-02", + "last_updated": "2026-02-02", "cost": { - "input": 0.13, - "output": 0 - }, - "type": "embedding" + "input": 0.1, + "output": 0.3 + } }, { - "id": "grok-3", - "name": "Grok 3", - "display_name": "Grok 3", + "id": "moonshotai/kimi-k2-thinking-turbo", + "name": "Kimi K2 Thinking Turbo", + "display_name": "Kimi K2 Thinking Turbo", "modalities": { "input": [ "text" @@ -53933,99 +52019,98 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 262000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "knowledge": "2024-11", - "release_date": "2025-02-17", - "last_updated": "2025-02-17", + "knowledge": "2025-01-01", + "release_date": "2025-11-06", + "last_updated": "2025-11-06", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.75 - }, - "type": "chat" + "input": 1.15, + "output": 8, + "cache_read": 0.15 + } }, { - "id": "gpt-3.5-turbo-0125", - "name": "GPT-3.5 Turbo 0125", - "display_name": "GPT-3.5 Turbo 0125", + "id": "moonshotai/kimi-k2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 262000, + "output": 64000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2021-08", - "release_date": "2024-01-25", - "last_updated": "2024-01-25", + "knowledge": "2025-01-01", + "release_date": "2026-01-27", + "last_updated": "2026-01-27", "cost": { - "input": 0.5, - "output": 1.5 - }, - "type": "chat" + "input": 0.58, + "output": 3.02, + "cache_read": 0.1 + } }, { - "id": "claude-sonnet-4-5", - "name": "Claude Sonnet 4.5", - "display_name": "Claude Sonnet 4.5", + "id": "moonshotai/kimi-k2-0905", + "name": "MoonshotAI: Kimi K2 0905", + "display_name": "MoonshotAI: Kimi K2 0905", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-11-18", - "last_updated": "2025-11-18", + "knowledge": "2025-01-01", + "release_date": "2025-09-04", + "last_updated": "2025-09-04", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.6, + "output": 2.5, + "cache_read": 0.15 }, "type": "chat" }, { - "id": "phi-4-mini-reasoning", - "name": "Phi-4-mini-reasoning", - "display_name": "Phi-4-mini-reasoning", + "id": "moonshotai/kimi-k2-thinking", + "name": "Kimi K2 Thinking", + "display_name": "Kimi K2 Thinking", "modalities": { "input": [ "text" @@ -54035,8 +52120,8 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 262000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -54045,20 +52130,20 @@ "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "open_weights": false, + "knowledge": "2025-01-01", + "release_date": "2025-11-06", + "last_updated": "2025-11-06", "cost": { - "input": 0.075, - "output": 0.3 - }, - "type": "chat" + "input": 0.6, + "output": 2.5, + "cache_read": 0.15 + } }, { - "id": "phi-4", - "name": "Phi-4", - "display_name": "Phi-4", + "id": "xiaomi/mimo-v2-flash-free", + "name": "MiMo-V2-Flash Free", + "display_name": "MiMo-V2-Flash Free", "modalities": { "input": [ "text" @@ -54068,29 +52153,29 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 262000, + "output": 64000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "open_weights": false, + "knowledge": "2025-01-01", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", "cost": { - "input": 0.125, - "output": 0.5 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "deepseek-v3.1", - "name": "DeepSeek-V3.1", - "display_name": "DeepSeek-V3.1", + "id": "xiaomi/mimo-v2-flash", + "name": "MiMo-V2-Flash", + "display_name": "MiMo-V2-Flash", "modalities": { "input": [ "text" @@ -54100,8 +52185,8 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 262000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -54110,89 +52195,87 @@ "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-08-21", - "last_updated": "2025-08-21", + "open_weights": false, + "knowledge": "2025-01-01", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", "cost": { - "input": 0.56, - "output": 1.68 - }, - "type": "chat" + "input": 0.1, + "output": 0.3, + "cache_read": 0.01 + } }, { - "id": "gpt-5-chat", - "name": "GPT-5 Chat", - "display_name": "GPT-5 Chat", + "id": "x-ai/grok-4", + "name": "Grok 4", + "display_name": "Grok 4", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 256000, + "output": 64000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-10-24", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "knowledge": "2025-07", + "release_date": "2025-07-09", + "last_updated": "2025-07-09", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.13 - }, - "type": "chat" + "input": 3, + "output": 15, + "cache_read": 0.75, + "reasoning": 15 + } }, { - "id": "gpt-4.1-mini", - "name": "GPT-4.1 mini", - "display_name": "GPT-4.1 mini", + "id": "x-ai/grok-code-fast-1", + "name": "Grok Code Fast 1", + "display_name": "Grok Code Fast 1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 256000, + "output": 10000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-05", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "knowledge": "2023-10", + "release_date": "2025-08-28", + "last_updated": "2025-08-28", "cost": { - "input": 0.4, - "output": 1.6, - "cache_read": 0.1 - }, - "type": "chat" + "input": 0.2, + "output": 1.5, + "cache_read": 0.02 + } }, { - "id": "llama-4-maverick-17b-128e-instruct-fp8", - "name": "Llama 4 Maverick 17B 128E Instruct FP8", - "display_name": "Llama 4 Maverick 17B 128E Instruct FP8", + "id": "x-ai/grok-4.1-fast-non-reasoning", + "name": "Grok 4.1 Fast Non Reasoning", + "display_name": "Grok 4.1 Fast Non Reasoning", "modalities": { "input": [ "text", @@ -54203,8 +52286,8 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 2000000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -54212,31 +52295,32 @@ "supported": false }, "attachment": true, - "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "open_weights": false, + "knowledge": "2025-01-01", + "release_date": "2025-11-20", + "last_updated": "2025-11-20", "cost": { - "input": 0.25, - "output": 1 - }, - "type": "chat" + "input": 0.2, + "output": 0.5, + "cache_read": 0.05 + } }, { - "id": "cohere-command-r-plus-08-2024", - "name": "Command R+", - "display_name": "Command R+", + "id": "x-ai/grok-4-fast", + "name": "Grok 4 Fast", + "display_name": "Grok 4 Fast", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4000 + "context": 2000000, + "output": 30000 }, "temperature": true, "tool_call": true, @@ -54244,32 +52328,33 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-06-01", - "release_date": "2024-08-30", - "last_updated": "2024-08-30", + "attachment": true, + "open_weights": false, + "knowledge": "2025-07", + "release_date": "2025-09-19", + "last_updated": "2025-09-19", "cost": { - "input": 2.5, - "output": 10 - }, - "type": "chat" + "input": 0.2, + "output": 0.5, + "cache_read": 0.05 + } }, { - "id": "cohere-command-a", - "name": "Command A", - "display_name": "Command A", + "id": "x-ai/grok-4.1-fast", + "name": "Grok 4.1 Fast", + "display_name": "Grok 4.1 Fast", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 8000 + "context": 2000000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -54277,21 +52362,21 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-06-01", - "release_date": "2025-03-13", - "last_updated": "2025-03-13", + "attachment": true, + "open_weights": false, + "knowledge": "2025-01-01", + "release_date": "2025-11-20", + "last_updated": "2025-11-20", "cost": { - "input": 2.5, - "output": 10 - }, - "type": "chat" + "input": 0.2, + "output": 0.5, + "cache_read": 0.05 + } }, { - "id": "phi-3-small-128k-instruct", - "name": "Phi-3-small-instruct (128k)", - "display_name": "Phi-3-small-instruct (128k)", + "id": "deepseek/deepseek-chat", + "name": "DeepSeek: DeepSeek V3", + "display_name": "DeepSeek: DeepSeek V3", "modalities": { "input": [ "text" @@ -54301,41 +52386,40 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 163840, + "output": 163840 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-04-23", - "last_updated": "2024-04-23", + "open_weights": false, + "knowledge": "2025-01-01", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "cost": { - "input": 0.15, - "output": 0.6 + "input": 0.28, + "output": 0.42, + "cache_read": 0.03 }, "type": "chat" }, { - "id": "claude-opus-4-5", - "name": "Claude Opus 4.5", - "display_name": "Claude Opus 4.5", + "id": "deepseek/deepseek-v3.2-exp", + "name": "DeepSeek-V3.2-Exp", + "display_name": "DeepSeek-V3.2-Exp", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, + "context": 163000, "output": 64000 }, "temperature": true, @@ -54344,27 +52428,23 @@ "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-11-24", - "last_updated": "2025-08-01", + "knowledge": "2025-01-01", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 5, - "output": 25, - "cache_read": 1.5, - "cache_write": 18.75 - }, - "type": "chat" + "input": 0.22, + "output": 0.33 + } }, { - "id": "mistral-medium-2505", - "name": "Mistral Medium 3", - "display_name": "Mistral Medium 3", + "id": "deepseek/deepseek-v3.2", + "name": "DeepSeek V3.2", + "display_name": "DeepSeek V3.2", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -54372,28 +52452,28 @@ }, "limit": { "context": 128000, - "output": 128000 + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-05", - "release_date": "2025-05-07", - "last_updated": "2025-05-07", + "knowledge": "2025-01-01", + "release_date": "2025-12-05", + "last_updated": "2025-12-05", "cost": { - "input": 0.4, - "output": 2 - }, - "type": "chat" + "input": 0.28, + "output": 0.43 + } }, { - "id": "deepseek-v3.2-speciale", - "name": "DeepSeek-V3.2-Speciale", - "display_name": "DeepSeek-V3.2-Speciale", + "id": "minimax/minimax-m2", + "name": "MiniMax M2", + "display_name": "MiniMax M2", "modalities": { "input": [ "text" @@ -54403,42 +52483,78 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 204000, + "output": 64000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-12-01", - "last_updated": "2025-12-01", + "open_weights": false, + "knowledge": "2025-01-01", + "release_date": "2025-10-27", + "last_updated": "2025-10-27", "cost": { - "input": 0.28, - "output": 0.42 + "input": 0.3, + "output": 1.2, + "cache_read": 0.03, + "cache_write": 0.38 + } + }, + { + "id": "minimax/minimax-m2.1", + "name": "MiniMax M2.1", + "display_name": "MiniMax M2.1", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] }, - "type": "chat" + "limit": { + "context": 204000, + "output": 64000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": false, + "knowledge": "2025-01-01", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", + "cost": { + "input": 0.3, + "output": 1.2, + "cache_read": 0.03, + "cache_write": 0.38 + } }, { - "id": "claude-haiku-4-5", - "name": "Claude Haiku 4.5", - "display_name": "Claude Haiku 4.5", + "id": "google/gemini-3-flash-preview", + "name": "Gemini 3 Flash Preview", + "display_name": "Gemini 3 Flash Preview", "modalities": { "input": [ "text", "image", - "pdf" + "pdf", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 200000, + "context": 1048000, "output": 64000 }, "temperature": true, @@ -54449,102 +52565,108 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-02-31", - "release_date": "2025-11-18", - "last_updated": "2025-11-18", + "knowledge": "2025-01-01", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", "cost": { - "input": 1, - "output": 5, - "cache_read": 0.1, - "cache_write": 1.25 - }, - "type": "chat" + "input": 0.5, + "output": 3, + "cache_read": 0.05, + "cache_write": 1 + } }, { - "id": "phi-3-mini-4k-instruct", - "name": "Phi-3-mini-instruct (4k)", - "display_name": "Phi-3-mini-instruct (4k)", + "id": "google/gemini-3-pro-preview", + "name": "Gemini 3 Pro Preview", + "display_name": "Gemini 3 Pro Preview", "modalities": { "input": [ - "text" + "text", + "image", + "pdf", + "audio", + "video" ], "output": [ "text" ] }, "limit": { - "context": 4096, - "output": 1024 + "context": 1048000, + "output": 64000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-04-23", - "last_updated": "2024-04-23", + "attachment": true, + "open_weights": false, + "knowledge": "2025-01-01", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", "cost": { - "input": 0.13, - "output": 0.52 - }, - "type": "chat" + "input": 2, + "output": 12, + "cache_read": 0.2, + "cache_write": 4.5 + } }, { - "id": "gpt-5.1-codex", - "name": "GPT-5.1 Codex", - "display_name": "GPT-5.1 Codex", + "id": "google/gemini-2.5-flash", + "name": "Google: Gemini 2.5 Flash", + "display_name": "Google: Gemini 2.5 Flash", "modalities": { "input": [ - "text", "image", + "text", "audio" ], "output": [ - "text", - "image", - "audio" + "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 1048576, + "output": 65535 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-14", - "last_updated": "2025-11-14", + "knowledge": "2025-01-01", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 0.3, + "output": 2.5, + "cache_read": 0.07, + "cache_write": 1 }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "grok-code-fast-1", - "name": "Grok Code Fast 1", - "display_name": "Grok Code Fast 1", + "id": "google/gemini-2.5-flash-lite", + "name": "Google: Gemini 2.5 Flash Lite", + "display_name": "Google: Gemini 2.5 Flash Lite", "modalities": { "input": [ - "text" + "image", + "text", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 10000 + "context": 1048576, + "output": 65535 }, "temperature": true, "tool_call": true, @@ -54552,184 +52674,202 @@ "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2023-10", - "release_date": "2025-08-28", - "last_updated": "2025-08-28", + "knowledge": "2025-01-01", + "release_date": "2025-07-22", + "last_updated": "2025-07-22", "cost": { - "input": 0.2, - "output": 1.5, - "cache_read": 0.02 + "input": 0.1, + "output": 0.4, + "cache_read": 0.03, + "cache_write": 1 }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "deepseek-r1", - "name": "DeepSeek-R1", - "display_name": "DeepSeek-R1", + "id": "google/gemini-2.5-pro", + "name": "Google: Gemini 2.5 Pro", + "display_name": "Google: Gemini 2.5 Pro", "modalities": { "input": [ - "text" + "image", + "text", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 163840, - "output": 163840 + "context": 1048576, + "output": 65536 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-01-20", - "last_updated": "2025-01-20", + "attachment": true, + "open_weights": false, + "knowledge": "2025-01-01", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", "cost": { - "input": 1.35, - "output": 5.4 + "input": 1.25, + "output": 10, + "cache_read": 0.31, + "cache_write": 4.5 }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "meta-llama-3.1-405b-instruct", - "name": "Meta-Llama-3.1-405B-Instruct", - "display_name": "Meta-Llama-3.1-405B-Instruct", + "id": "volcengine/doubao-seed-code", + "name": "Doubao-Seed-Code", + "display_name": "Doubao-Seed-Code", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 256000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "attachment": true, + "open_weights": false, + "knowledge": "2025-01-01", + "release_date": "2025-11-11", + "last_updated": "2025-11-11", "cost": { - "input": 5.33, - "output": 16 - }, - "type": "chat" + "input": 0.17, + "output": 1.12, + "cache_read": 0.03 + } }, { - "id": "gpt-4-32k", - "name": "GPT-4 32K", - "display_name": "GPT-4 32K", + "id": "volcengine/doubao-seed-1.8", + "name": "Doubao-Seed-1.8", + "display_name": "Doubao-Seed-1.8", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 256000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2023-11", - "release_date": "2023-03-14", - "last_updated": "2023-03-14", + "knowledge": "2025-01-01", + "release_date": "2025-12-18", + "last_updated": "2025-12-18", "cost": { - "input": 60, - "output": 120 - }, - "type": "chat" + "input": 0.11, + "output": 0.28, + "cache_read": 0.02, + "cache_write": 0.0024 + } }, { - "id": "phi-4-mini", - "name": "Phi-4-mini", - "display_name": "Phi-4-mini", + "id": "openai/gpt-5.2-codex", + "name": "GPT-5.2-Codex", + "display_name": "GPT-5.2-Codex", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 400000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "attachment": true, + "open_weights": false, + "knowledge": "2025-01-01", + "release_date": "2026-01-15", + "last_updated": "2026-01-15", "cost": { - "input": 0.075, - "output": 0.3 - }, - "type": "chat" + "input": 1.75, + "output": 14, + "cache_read": 0.17 + } }, { - "id": "cohere-embed-v3-multilingual", - "name": "Embed v3 Multilingual", - "display_name": "Embed v3 Multilingual", + "id": "openai/gpt-5.1-codex", + "name": "GPT-5.1-Codex", + "display_name": "GPT-5.1-Codex", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 512, - "output": 1024 + "context": 400000, + "output": 64000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2023-11-07", - "last_updated": "2023-11-07", + "attachment": true, + "open_weights": false, + "knowledge": "2025-01-01", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.1, - "output": 0 - }, - "type": "chat" + "input": 1.25, + "output": 10, + "cache_read": 0.12 + } }, { - "id": "grok-4", - "name": "Grok 4", - "display_name": "Grok 4", + "id": "openai/gpt-5.1-codex-mini", + "name": "GPT-5.1-Codex-Mini", + "display_name": "GPT-5.1-Codex-Mini", "modalities": { "input": [ + "image", "text" ], "output": [ @@ -54737,7 +52877,7 @@ ] }, "limit": { - "context": 256000, + "context": 400000, "output": 64000 }, "temperature": true, @@ -54746,34 +52886,34 @@ "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-07-09", - "last_updated": "2025-07-09", + "knowledge": "2025-01-01", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 3, - "output": 15, - "reasoning": 15, - "cache_read": 0.75 - }, - "type": "chat" + "input": 0.25, + "output": 2, + "cache_read": 0.03 + } }, { - "id": "cohere-command-r-08-2024", - "name": "Command R", - "display_name": "Command R", + "id": "openai/gpt-5.1", + "name": "GPT-5.1", + "display_name": "GPT-5.1", "modalities": { "input": [ - "text" + "image", + "text", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4000 + "context": 400000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -54781,21 +52921,21 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-06-01", - "release_date": "2024-08-30", - "last_updated": "2024-08-30", + "attachment": true, + "open_weights": false, + "knowledge": "2025-01-01", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.15, - "output": 0.6 - }, - "type": "chat" + "input": 1.25, + "output": 10, + "cache_read": 0.12 + } }, { - "id": "cohere-embed-v-4-0", - "name": "Embed v4", - "display_name": "Embed v4", + "id": "openai/gpt-5-codex", + "name": "GPT-5 Codex", + "display_name": "GPT-5 Codex", "modalities": { "input": [ "text", @@ -54806,32 +52946,35 @@ ] }, "limit": { - "context": 128000, - "output": 1536 + "context": 400000, + "output": 64000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, - "open_weights": true, - "release_date": "2025-04-15", - "last_updated": "2025-04-15", + "open_weights": false, + "knowledge": "2025-01-01", + "release_date": "2025-09-23", + "last_updated": "2025-09-23", "cost": { - "input": 0.12, - "output": 0 - }, - "type": "chat" + "input": 1.25, + "output": 10, + "cache_read": 0.12 + } }, { - "id": "llama-3.2-11b-vision-instruct", - "name": "Llama-3.2-11B-Vision-Instruct", - "display_name": "Llama-3.2-11B-Vision-Instruct", + "id": "openai/gpt-5.1-chat", + "name": "GPT-5.1 Chat", + "display_name": "GPT-5.1 Chat", "modalities": { "input": [ - "text", - "image" + "pdf", + "image", + "text" ], "output": [ "text" @@ -54839,7 +52982,7 @@ }, "limit": { "context": 128000, - "output": 8192 + "output": 64000 }, "temperature": true, "tool_call": true, @@ -54847,20 +52990,20 @@ "supported": false }, "attachment": true, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-09-25", - "last_updated": "2024-09-25", + "open_weights": false, + "knowledge": "2025-01-01", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.37, - "output": 0.37 - }, - "type": "chat" + "input": 1.25, + "output": 10, + "cache_read": 0.12 + } }, { - "id": "gpt-5.2-chat", - "name": "GPT-5.2 Chat", - "display_name": "GPT-5.2 Chat", + "id": "openai/gpt-5", + "name": "gpt-5", + "display_name": "gpt-5", "modalities": { "input": [ "text", @@ -54871,8 +53014,8 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 272000, + "output": 128000 }, "temperature": false, "tool_call": true, @@ -54882,24 +53025,24 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "knowledge": "2024-09-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 1.25, + "output": 10, + "cache_read": 0.13 }, "type": "chat" }, { - "id": "claude-opus-4-1", - "name": "Claude Opus 4.1", - "display_name": "Claude Opus 4.1", + "id": "openai/gpt-5.2", + "name": "GPT-5.2", + "display_name": "GPT-5.2", "modalities": { "input": [ - "text", "image", + "text", "pdf" ], "output": [ @@ -54907,8 +53050,8 @@ ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 400000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -54918,53 +53061,53 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-11-18", - "last_updated": "2025-11-18", + "knowledge": "2025-01-01", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 - }, - "type": "chat" + "input": 1.75, + "output": 14, + "cache_read": 0.17 + } }, { - "id": "gpt-4", - "name": "GPT-4", - "display_name": "GPT-4", + "id": "baidu/ernie-5.0-thinking-preview", + "name": "ERNIE 5.0", + "display_name": "ERNIE 5.0", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 128000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false - }, - "attachment": false, + "supported": true, + "default": true + }, + "attachment": true, "open_weights": false, - "knowledge": "2023-11", - "release_date": "2023-03-14", - "last_updated": "2023-03-14", + "knowledge": "2025-01-01", + "release_date": "2026-01-22", + "last_updated": "2026-01-22", "cost": { - "input": 60, - "output": 120 - }, - "type": "chat" + "input": 0.84, + "output": 3.37 + } }, { - "id": "phi-3-medium-128k-instruct", - "name": "Phi-3-medium-instruct (128k)", - "display_name": "Phi-3-medium-instruct (128k)", + "id": "inclusionai/ring-1t", + "name": "inclusionAI: Ring 1T", + "display_name": "inclusionAI: Ring 1T", "modalities": { "input": [ "text" @@ -54974,64 +53117,64 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 131072, + "output": 131072 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-04-23", - "last_updated": "2024-04-23", + "open_weights": false, + "knowledge": "2025-01-01", + "release_date": "2025-10-12", + "last_updated": "2025-10-12", "cost": { - "input": 0.17, - "output": 0.68 + "input": 0.56, + "output": 2.24, + "cache_read": 0.11 }, "type": "chat" }, { - "id": "grok-4-fast-reasoning", - "name": "Grok 4 Fast (Reasoning)", - "display_name": "Grok 4 Fast (Reasoning)", + "id": "inclusionai/ling-1t", + "name": "inclusionAI: Ling-1T", + "display_name": "inclusionAI: Ling-1T", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-09-19", - "last_updated": "2025-09-19", + "knowledge": "2025-01-01", + "release_date": "2025-10-09", + "last_updated": "2025-10-09", "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 + "input": 0.56, + "output": 2.24, + "cache_read": 0.11 }, "type": "chat" }, { - "id": "deepseek-r1-0528", - "name": "DeepSeek-R1-0528", - "display_name": "DeepSeek-R1-0528", + "id": "z-ai/glm-4.7", + "name": "GLM 4.7", + "display_name": "GLM 4.7", "modalities": { "input": [ "text" @@ -55041,8 +53184,8 @@ ] }, "limit": { - "context": 163840, - "output": 163840 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -55051,127 +53194,123 @@ "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-05-28", - "last_updated": "2025-05-28", + "open_weights": false, + "knowledge": "2025-01-01", + "release_date": "2025-12-23", + "last_updated": "2025-12-23", "cost": { - "input": 1.35, - "output": 5.4 - }, - "type": "chat" + "input": 0.28, + "output": 1.14, + "cache_read": 0.06 + } }, { - "id": "grok-4-fast-non-reasoning", - "name": "Grok 4 Fast (Non-Reasoning)", - "display_name": "Grok 4 Fast (Non-Reasoning)", + "id": "z-ai/glm-4.6v-flash-free", + "name": "GLM 4.6V Flash (Free)", + "display_name": "GLM 4.6V Flash (Free)", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-09-19", - "last_updated": "2025-09-19", + "knowledge": "2025-01-01", + "release_date": "2025-12-08", + "last_updated": "2025-12-08", "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "text-embedding-3-small", - "name": "text-embedding-3-small", - "display_name": "text-embedding-3-small", + "id": "z-ai/glm-4.6v-flash", + "name": "GLM 4.6V FlashX", + "display_name": "GLM 4.6V FlashX", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 8191, - "output": 1536 + "context": 200000, + "output": 64000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2024-01-25", - "last_updated": "2024-01-25", + "knowledge": "2025-01-01", + "release_date": "2025-12-08", + "last_updated": "2025-12-08", "cost": { "input": 0.02, - "output": 0 - }, - "type": "embedding" + "output": 0.21, + "cache_read": 0.0043 + } }, { - "id": "gpt-4.1-nano", - "name": "GPT-4.1 nano", - "display_name": "GPT-4.1 nano", + "id": "z-ai/glm-4.5", + "name": "GLM-4.5", + "display_name": "GLM-4.5", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 131072, + "output": 98304 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-05", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.03 - }, - "type": "chat" - } - ] - }, - "llama": { - "id": "llama", - "name": "Llama", - "display_name": "Llama", - "api": "https://api.llama.com/compat/v1/", - "doc": "https://llama.developer.meta.com/docs/models", - "models": [ + "input": 0.6, + "output": 2.2, + "cache_read": 0.11, + "cache_write": 0 + } + }, { - "id": "llama-3.3-8b-instruct", - "name": "Llama-3.3-8B-Instruct", - "display_name": "Llama-3.3-8B-Instruct", + "id": "z-ai/glm-4.5-air", + "name": "GLM-4.5-Air", + "display_name": "GLM-4.5-Air", "modalities": { "input": [ "text" @@ -55181,62 +53320,65 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 131072, + "output": 98304 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.2, + "output": 1.1, + "cache_read": 0.03, + "cache_write": 0 + } }, { - "id": "llama-4-maverick-17b-128e-instruct-fp8", - "name": "Llama-4-Maverick-17B-128E-Instruct-FP8", - "display_name": "Llama-4-Maverick-17B-128E-Instruct-FP8", + "id": "z-ai/glm-4.6", + "name": "GLM-4.6", + "display_name": "GLM-4.6", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "knowledge": "2025-04", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.6, + "output": 2.2, + "cache_read": 0.11, + "cache_write": 0 + } }, { - "id": "llama-3.3-70b-instruct", - "name": "Llama-3.3-70B-Instruct", - "display_name": "Llama-3.3-70B-Instruct", + "id": "z-ai/glm-4.7-flash-free", + "name": "GLM 4.7 Flash (Free)", + "display_name": "GLM 4.7 Flash (Free)", "modalities": { "input": [ "text" @@ -55246,94 +53388,97 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "attachment": false, + "open_weights": false, + "knowledge": "2025-01-01", + "release_date": "2026-01-19", + "last_updated": "2026-01-19", "cost": { "input": 0, "output": 0 - }, - "type": "chat" + } }, { - "id": "llama-4-scout-17b-16e-instruct-fp8", - "name": "Llama-4-Scout-17B-16E-Instruct-FP8", - "display_name": "Llama-4-Scout-17B-16E-Instruct-FP8", + "id": "z-ai/glm-4.7-flashx", + "name": "GLM 4.7 FlashX", + "display_name": "GLM 4.7 FlashX", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "attachment": false, + "open_weights": false, + "knowledge": "2025-01-01", + "release_date": "2026-01-19", + "last_updated": "2026-01-19", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.07, + "output": 0.42, + "cache_read": 0.01 + } }, { - "id": "groq-llama-4-maverick-17b-128e-instruct", - "name": "Groq-Llama-4-Maverick-17B-128E-Instruct", - "display_name": "Groq-Llama-4-Maverick-17B-128E-Instruct", + "id": "z-ai/glm-4.6v", + "name": "GLM 4.6V", + "display_name": "GLM 4.6V", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "open_weights": false, + "knowledge": "2025-01-01", + "release_date": "2025-12-08", + "last_updated": "2025-12-08", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "input": 0.14, + "output": 0.42, + "cache_read": 0.03 + } }, { - "id": "cerebras-llama-4-scout-17b-16e-instruct", - "name": "Cerebras-Llama-4-Scout-17B-16E-Instruct", - "display_name": "Cerebras-Llama-4-Scout-17B-16E-Instruct", + "id": "qwen/qwen3-max", + "name": "Qwen: Qwen3 Max", + "display_name": "Qwen: Qwen3 Max", "modalities": { "input": [ "text" @@ -55343,29 +53488,29 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 256000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "attachment": false, + "open_weights": false, + "knowledge": "2025-01-01", + "release_date": "2026-01-23", + "last_updated": "2026-01-23", "cost": { - "input": 0, - "output": 0 + "input": 1.2, + "output": 6 }, "type": "chat" }, { - "id": "cerebras-llama-4-maverick-17b-128e-instruct", - "name": "Cerebras-Llama-4-Maverick-17B-128E-Instruct", - "display_name": "Cerebras-Llama-4-Maverick-17B-128E-Instruct", + "id": "qwen/qwen3-coder-plus", + "name": "Qwen: Qwen3 Coder 480B A35B Instruct", + "display_name": "Qwen: Qwen3 Coder 480B A35B Instruct", "modalities": { "input": [ "text" @@ -55375,38 +53520,30 @@ ] }, "limit": { - "context": 128000, + "context": 4096, "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "attachment": false, + "open_weights": false, + "knowledge": "2025-01-01", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" - } - ] - }, - "scaleway": { - "id": "scaleway", - "name": "Scaleway", - "display_name": "Scaleway", - "api": "https://api.scaleway.ai/v1", - "doc": "https://www.scaleway.com/en/docs/generative-apis/", - "models": [ + "input": 1, + "output": 5, + "cache_read": 0.1, + "cache_write": 1.25 + } + }, { - "id": "qwen3-235b-a22b-instruct-2507", - "name": "Qwen3 235B A22B Instruct 2507", - "display_name": "Qwen3 235B A22B Instruct 2507", + "id": "kuaishou/kat-coder-pro-v1-free", + "name": "KAT-Coder-Pro-V1 Free", + "display_name": "KAT-Coder-Pro-V1 Free", "modalities": { "input": [ "text" @@ -55416,28 +53553,28 @@ ] }, "limit": { - "context": 260000, - "output": 8192 + "context": 256000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": true, - "release_date": "2025-07-01", - "last_updated": "2025-07-01", + "attachment": false, + "open_weights": false, + "knowledge": "2025-01-01", + "release_date": "2025-10-23", + "last_updated": "2025-10-23", "cost": { - "input": 0.75, - "output": 2.25 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "devstral-2-123b-instruct-2512", - "name": "Devstral 2 123B Instruct (2512)", - "display_name": "Devstral 2 123B Instruct (2512)", + "id": "kuaishou/kat-coder-pro-v1", + "name": "KAT-Coder-Pro-V1", + "display_name": "KAT-Coder-Pro-V1", "modalities": { "input": [ "text" @@ -55448,7 +53585,7 @@ }, "limit": { "context": 256000, - "output": 8192 + "output": 64000 }, "temperature": true, "tool_call": true, @@ -55456,19 +53593,20 @@ "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2026-01-07", - "last_updated": "2026-01-07", + "open_weights": false, + "knowledge": "2025-01-01", + "release_date": "2025-10-23", + "last_updated": "2025-10-23", "cost": { - "input": 0.4, - "output": 2 - }, - "type": "chat" + "input": 0.3, + "output": 1.2, + "cache_read": 0.06 + } }, { - "id": "pixtral-12b-2409", - "name": "Pixtral 12B 2409", - "display_name": "Pixtral 12B 2409", + "id": "anthropic/claude-opus-4", + "name": "Claude Opus 4", + "display_name": "Claude Opus 4", "modalities": { "input": [ "text", @@ -55479,30 +53617,34 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 200000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, - "open_weights": true, - "release_date": "2024-09-25", - "last_updated": "2024-09-25", + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 0.2, - "output": 0.2 - }, - "type": "chat" + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 + } }, { - "id": "llama-3.1-8b-instruct", - "name": "Llama 3.1 8B Instruct", - "display_name": "Llama 3.1 8B Instruct", + "id": "anthropic/claude-haiku-4.5", + "name": "Claude Haiku 4.5", + "display_name": "Claude Haiku 4.5", "modalities": { "input": [ + "image", "text" ], "output": [ @@ -55510,39 +53652,41 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "attachment": true, + "open_weights": false, + "knowledge": "2025-01-01", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "cost": { - "input": 0.2, - "output": 0.2 - }, - "type": "chat" + "input": 1, + "output": 5, + "cache_read": 0.1, + "cache_write": 1.25 + } }, { - "id": "mistral-nemo-instruct-2407", - "name": "Mistral Nemo Instruct 2407", - "display_name": "Mistral Nemo Instruct 2407", - "modalities": { + "id": "anthropic/claude-3.5-sonnet", + "name": "Claude Sonnet 3.5 v2", + "display_name": "Claude Sonnet 3.5 v2", + "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 200000, "output": 8192 }, "temperature": true, @@ -55551,19 +53695,21 @@ "supported": false }, "attachment": true, - "open_weights": true, - "release_date": "2024-07-25", - "last_updated": "2024-07-25", + "open_weights": false, + "knowledge": "2024-04-30", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", "cost": { - "input": 0.2, - "output": 0.2 - }, - "type": "chat" + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 + } }, { - "id": "mistral-small-3.2-24b-instruct-2506", - "name": "Mistral Small 3.2 24B Instruct (2506)", - "display_name": "Mistral Small 3.2 24B Instruct (2506)", + "id": "anthropic/claude-opus-4.1", + "name": "Claude Opus 4.1", + "display_name": "Claude Opus 4.1", "modalities": { "input": [ "text", @@ -55574,71 +53720,78 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 200000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-06-20", - "last_updated": "2025-06-20", + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.15, - "output": 0.35 - }, - "type": "chat" + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 + } }, { - "id": "qwen3-coder-30b-a3b-instruct", - "name": "Qwen3-Coder 30B-A3B Instruct", - "display_name": "Qwen3-Coder 30B-A3B Instruct", + "id": "anthropic/claude-3.7-sonnet", + "name": "Claude Sonnet 3.7", + "display_name": "Claude Sonnet 3.7", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2025-04", + "attachment": true, + "open_weights": false, + "knowledge": "2024-10-31", + "release_date": "2025-02-19", + "last_updated": "2025-02-19", "cost": { - "input": 0.2, - "output": 0.8 - }, - "type": "chat" + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 + } }, { - "id": "llama-3.3-70b-instruct", - "name": "Llama-3.3-70B-Instruct", - "display_name": "Llama-3.3-70B-Instruct", + "id": "anthropic/claude-3.5-haiku", + "name": "Claude Haiku 3.5", + "display_name": "Claude Haiku 3.5", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 100000, - "output": 4096 + "context": 200000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -55646,54 +53799,60 @@ "supported": false }, "attachment": true, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "open_weights": false, + "knowledge": "2024-07-31", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", "cost": { - "input": 0.9, - "output": 0.9 - }, - "type": "chat" + "input": 0.8, + "output": 4, + "cache_read": 0.08, + "cache_write": 1 + } }, { - "id": "whisper-large-v3", - "name": "Whisper Large v3", - "display_name": "Whisper Large v3", + "id": "anthropic/claude-sonnet-4", + "name": "Claude Sonnet 4", + "display_name": "Claude Sonnet 4", "modalities": { "input": [ - "audio" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 4096 + "context": 200000, + "output": 64000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-09", - "release_date": "2023-09-01", - "last_updated": "2025-09-05", + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 0.003, - "output": 0 - }, - "type": "chat" + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 + } }, { - "id": "deepseek-r1-distill-llama-70b", - "name": "DeepSeek R1 Distill Llama 70B", - "display_name": "DeepSeek R1 Distill Llama 70B", + "id": "anthropic/claude-opus-4.5", + "name": "Claude Opus 4.5", + "display_name": "Claude Opus 4.5", "modalities": { "input": [ + "pdf", + "image", "text" ], "output": [ @@ -55701,8 +53860,8 @@ ] }, "limit": { - "context": 32000, - "output": 4096 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -55710,53 +53869,57 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-01-20", - "last_updated": "2025-01-20", + "attachment": true, + "open_weights": false, + "knowledge": "2025-01-01", + "release_date": "2025-11-24", + "last_updated": "2025-11-24", "cost": { - "input": 0.9, - "output": 0.9 - }, - "type": "chat" + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 + } }, { - "id": "voxtral-small-24b-2507", - "name": "Voxtral Small 24B 2507", - "display_name": "Voxtral Small 24B 2507", + "id": "anthropic/claude-sonnet-4.5", + "name": "Claude Sonnet 4.5", + "display_name": "Claude Sonnet 4.5", "modalities": { "input": [ "text", - "audio" + "image" ], "output": [ "text" ] }, "limit": { - "context": 32000, - "output": 8192 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, - "open_weights": true, - "release_date": "2025-07-01", - "last_updated": "2025-07-01", + "open_weights": false, + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 0.15, - "output": 0.35 - }, - "type": "chat" + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 + } }, { - "id": "gpt-oss-120b", - "name": "GPT-OSS 120B", - "display_name": "GPT-OSS 120B", + "id": "deepseek/deepseek-chat-v3.1", + "name": "DeepSeek: DeepSeek V3.1", + "display_name": "DeepSeek: DeepSeek V3.1", "modalities": { "input": [ "text" @@ -55766,28 +53929,20 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 131072, + "output": 32768 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": true, - "release_date": "2024-01-01", - "last_updated": "2024-01-01", - "cost": { - "input": 0.15, - "output": 0.6 + "supported": true, + "default": true }, "type": "chat" }, { - "id": "bge-multilingual-gemma2", - "name": "BGE Multilingual Gemma2", - "display_name": "BGE Multilingual Gemma2", + "id": "deepseek/deepseek-r1-0528", + "name": "DeepSeek: R1 0528", + "display_name": "DeepSeek: R1 0528", "modalities": { "input": [ "text" @@ -55797,102 +53952,70 @@ ] }, "limit": { - "context": 8191, - "output": 3072 + "context": 163840, + "output": 163840 }, - "temperature": false, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "release_date": "2024-07-26", - "last_updated": "2025-06-15", - "cost": { - "input": 0.13, - "output": 0 + "supported": true, + "default": true }, "type": "chat" }, { - "id": "gemma-3-27b-it", - "name": "Gemma-3-27B-IT", - "display_name": "Gemma-3-27B-IT", + "id": "google/gemini-2.0-flash", + "name": "Google: Gemini 2.0 Flash", + "display_name": "Google: Gemini 2.0 Flash", "modalities": { "input": [ "text", - "image" + "image", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 40000, + "context": 1048576, "output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2024-12", - "release_date": "2024-12-01", - "last_updated": "2025-09-05", - "cost": { - "input": 0.25, - "output": 0.5 - }, - "type": "chat" - } - ] - }, - "amazon-bedrock": { - "id": "amazon-bedrock", - "name": "Amazon Bedrock", - "display_name": "Amazon Bedrock", - "doc": "https://docs.aws.amazon.com/bedrock/latest/userguide/models-supported.html", - "models": [ + "type": "imageGeneration" + }, { - "id": "cohere.command-r-plus-v1:0", - "name": "Command R+", - "display_name": "Command R+", + "id": "google/gemini-2.0-flash-lite-001", + "name": "Google: Gemini 2.0 Flash Lite", + "display_name": "Google: Gemini 2.0 Flash Lite", "modalities": { "input": [ - "text" + "text", + "image", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 1048576, + "output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-04", - "release_date": "2024-04-04", - "last_updated": "2024-04-04", - "cost": { - "input": 3, - "output": 15 - }, - "type": "chat" + "attachment": true, + "type": "imageGeneration" }, { - "id": "anthropic.claude-v2", - "name": "Claude 2", - "display_name": "Claude 2", + "id": "inclusionai/ling-flash-2.0", + "name": "inclusionAI: Ling Flash 2.0", + "display_name": "inclusionAI: Ling Flash 2.0", "modalities": { "input": [ "text" @@ -55902,102 +54025,64 @@ ] }, "limit": { - "context": 100000, - "output": 4096 + "context": 131072, + "output": 131072 }, - "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "knowledge": "2023-08", - "release_date": "2023-07-11", - "last_updated": "2023-07-11", - "cost": { - "input": 8, - "output": 24 - }, "type": "chat" }, { - "id": "anthropic.claude-3-7-sonnet-20250219-v1:0", - "name": "Claude Sonnet 3.7", - "display_name": "Claude Sonnet 3.7", + "id": "inclusionai/ling-mini-2.0", + "name": "inclusionAI: Ling Mini 2.0", + "display_name": "inclusionAI: Ling Mini 2.0", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 8192 + "context": 131072, + "output": 131072 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-02-19", - "last_updated": "2025-02-19", - "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 - }, "type": "chat" }, { - "id": "anthropic.claude-sonnet-4-20250514-v1:0", - "name": "Claude Sonnet 4", - "display_name": "Claude Sonnet 4", + "id": "inclusionai/ring-flash-2.0", + "name": "inclusionAI: Ring Flash 2.0", + "display_name": "inclusionAI: Ring Flash 2.0", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 131072, + "output": 131072 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", - "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 - }, "type": "chat" }, { - "id": "qwen.qwen3-coder-30b-a3b-v1:0", - "name": "Qwen3 Coder 30B A3B Instruct", - "display_name": "Qwen3 Coder 30B A3B Instruct", + "id": "inclusionai/ring-mini-2.0", + "name": "inclusionAI: Ring Mini 2.0", + "display_name": "inclusionAI: Ring Mini 2.0", "modalities": { "input": [ "text" @@ -56007,33 +54092,23 @@ ] }, "limit": { - "context": 262144, + "context": 131072, "output": 131072 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-09-18", - "last_updated": "2025-09-18", - "cost": { - "input": 0.15, - "output": 0.6 + "supported": true, + "default": true }, "type": "chat" }, { - "id": "google.gemma-3-4b-it", - "name": "Gemma 3 4B IT", - "display_name": "Gemma 3 4B IT", + "id": "moonshotai/kimi-k2-0711", + "name": "kimi-k2-0711", + "display_name": "kimi-k2-0711", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -56041,59 +54116,51 @@ }, "limit": { "context": 128000, - "output": 4096 + "output": 128000 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "release_date": "2024-12-01", - "last_updated": "2024-12-01", - "cost": { - "input": 0.04, - "output": 0.08 - }, "type": "chat" }, { - "id": "minimax.minimax-m2", - "name": "MiniMax M2", - "display_name": "MiniMax M2", + "id": "openai/gpt-4.1", + "name": "GPT-4.1", + "display_name": "GPT-4.1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 204608, - "output": 128000 + "context": 1047576, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2025-10-27", - "last_updated": "2025-10-27", + "attachment": true, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.3, - "output": 1.2 - }, - "type": "chat" + "input": 2, + "output": 8, + "cache_read": 0.5 + } }, { - "id": "meta.llama3-2-11b-instruct-v1:0", - "name": "Llama 3.2 11B Instruct", - "display_name": "Llama 3.2 11B Instruct", + "id": "openai/gpt-4.1-mini", + "name": "GPT-4.1 mini", + "display_name": "GPT-4.1 mini", "modalities": { "input": [ "text", @@ -56104,8 +54171,8 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 1047576, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -56113,64 +54180,65 @@ "supported": false }, "attachment": true, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-09-25", - "last_updated": "2024-09-25", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.16, - "output": 0.16 - }, - "type": "chat" + "input": 0.4, + "output": 1.6, + "cache_read": 0.1 + } }, { - "id": "qwen.qwen3-next-80b-a3b", - "name": "Qwen/Qwen3-Next-80B-A3B-Instruct", - "display_name": "Qwen/Qwen3-Next-80B-A3B-Instruct", + "id": "openai/gpt-4.1-nano", + "name": "GPT-4.1 nano", + "display_name": "GPT-4.1 nano", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 1047576, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-09-18", - "last_updated": "2025-11-25", + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.14, - "output": 1.4 - }, - "type": "chat" + "input": 0.1, + "output": 0.4, + "cache_read": 0.03 + } }, { - "id": "anthropic.claude-3-haiku-20240307-v1:0", - "name": "Claude Haiku 3", - "display_name": "Claude Haiku 3", + "id": "openai/gpt-4o", + "name": "GPT-4o", + "display_name": "GPT-4o", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 4096 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -56179,19 +54247,19 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-02", - "release_date": "2024-03-13", - "last_updated": "2024-03-13", + "knowledge": "2023-09", + "release_date": "2024-05-13", + "last_updated": "2024-08-06", "cost": { - "input": 0.25, - "output": 1.25 - }, - "type": "chat" + "input": 2.5, + "output": 10, + "cache_read": 1.25 + } }, { - "id": "meta.llama3-2-90b-instruct-v1:0", - "name": "Llama 3.2 90B Instruct", - "display_name": "Llama 3.2 90B Instruct", + "id": "openai/gpt-4o-mini", + "name": "GPT-4o mini", + "display_name": "GPT-4o mini", "modalities": { "input": [ "text", @@ -56203,7 +54271,7 @@ }, "limit": { "context": 128000, - "output": 4096 + "output": 16384 }, "temperature": true, "tool_call": true, @@ -56211,20 +54279,30 @@ "supported": false }, "attachment": true, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-09-25", - "last_updated": "2024-09-25", + "open_weights": false, + "knowledge": "2023-09", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", "cost": { - "input": 0.72, - "output": 0.72 + "input": 0.15, + "output": 0.6, + "cache_read": 0.08 + } + }, + { + "id": "openai/gpt-5-chat", + "name": "gpt-5-chat", + "display_name": "gpt-5-chat", + "limit": { + "context": 272000, + "output": 16384 }, "type": "chat" }, { - "id": "qwen.qwen3-vl-235b-a22b", - "name": "Qwen/Qwen3-VL-235B-A22B-Instruct", - "display_name": "Qwen/Qwen3-VL-235B-A22B-Instruct", + "id": "openai/gpt-5-mini", + "name": "gpt-5-mini", + "display_name": "gpt-5-mini", "modalities": { "input": [ "text", @@ -56235,63 +54313,70 @@ ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 272000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "release_date": "2025-10-04", - "last_updated": "2025-11-25", + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.3, - "output": 1.5 + "input": 0.25, + "output": 2, + "cache_read": 0.03 }, "type": "chat" }, { - "id": "meta.llama3-2-1b-instruct-v1:0", - "name": "Llama 3.2 1B Instruct", - "display_name": "Llama 3.2 1B Instruct", + "id": "openai/gpt-5-nano", + "name": "gpt-5-nano", + "display_name": "gpt-5-nano", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131000, - "output": 4096 + "context": 272000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-09-25", - "last_updated": "2024-09-25", + "attachment": true, + "open_weights": false, + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.1, - "output": 0.1 + "input": 0.05, + "output": 0.4, + "cache_read": 0.01 }, "type": "chat" }, { - "id": "anthropic.claude-v2:1", - "name": "Claude 2.1", - "display_name": "Claude 2.1", + "id": "openai/o4-mini", + "name": "o4-mini", + "display_name": "o4-mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -56299,28 +54384,29 @@ }, "limit": { "context": 200000, - "output": 4096 + "output": 100000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2023-08", - "release_date": "2023-11-21", - "last_updated": "2023-11-21", + "knowledge": "2024-05", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "cost": { - "input": 8, - "output": 24 - }, - "type": "chat" + "input": 1.1, + "output": 4.4, + "cache_read": 0.28 + } }, { - "id": "deepseek.v3-v1:0", - "name": "DeepSeek-V3.1", - "display_name": "DeepSeek-V3.1", + "id": "qwen/qwen3-235b-a22b-2507", + "name": "Qwen: Qwen3 235B A22B Instruct 2507", + "display_name": "Qwen: Qwen3 235B A22B Instruct 2507", "modalities": { "input": [ "text" @@ -56330,67 +54416,43 @@ ] }, "limit": { - "context": 163840, - "output": 81920 + "context": 262144, + "output": 262144 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-09-18", - "last_updated": "2025-09-18", - "cost": { - "input": 0.58, - "output": 1.68 - }, "type": "chat" }, { - "id": "anthropic.claude-opus-4-5-20251101-v1:0", - "name": "Claude Opus 4.5", - "display_name": "Claude Opus 4.5", + "id": "qwen/qwen3-235b-a22b-thinking-2507", + "name": "Qwen: Qwen3 235B A22B Thinking 2507", + "display_name": "Qwen: Qwen3 235B A22B Thinking 2507", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 262144, + "output": 262144 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-11-24", - "last_updated": "2025-08-01", - "cost": { - "input": 5, - "output": 25, - "cache_read": 1.5, - "cache_write": 18.75 - }, "type": "chat" }, { - "id": "cohere.command-light-text-v14", - "name": "Command Light", - "display_name": "Command Light", + "id": "qwen/qwen3-coder", + "name": "Qwen: Qwen3 Coder 480B A35B", + "display_name": "Qwen: Qwen3 Coder 480B A35B", "modalities": { "input": [ "text" @@ -56400,60 +54462,45 @@ ] }, "limit": { - "context": 4096, - "output": 4096 + "context": 262144, + "output": 262144 }, - "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-08", - "release_date": "2023-11-01", - "last_updated": "2023-11-01", - "cost": { - "input": 0.3, - "output": 0.6 + "supported": true, + "default": true }, "type": "chat" }, { - "id": "mistral.mistral-large-2402-v1:0", - "name": "Mistral Large (24.02)", - "display_name": "Mistral Large (24.02)", + "id": "qwen/qwen3-vl-plus", + "name": "Qwen: Qwen3 VL 235B A22B Instruct", + "display_name": "Qwen: Qwen3 VL 235B A22B Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "release_date": "2024-12-01", - "last_updated": "2024-12-01", - "cost": { - "input": 0.5, - "output": 1.5 + "supported": true, + "default": true }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "google.gemma-3-27b-it", - "name": "Google Gemma 3 27B Instruct", - "display_name": "Google Gemma 3 27B Instruct", + "id": "x-ai/grok-4-fast-non-reasoning", + "name": "Grok 4 Fast (Non-Reasoning)", + "display_name": "Grok 4 Fast (Non-Reasoning)", "modalities": { "input": [ "text", @@ -56464,8 +54511,8 @@ ] }, "limit": { - "context": 202752, - "output": 8192 + "context": 2000000, + "output": 30000 }, "temperature": true, "tool_call": true, @@ -56473,85 +54520,100 @@ "supported": false }, "attachment": true, - "open_weights": true, + "open_weights": false, "knowledge": "2025-07", - "release_date": "2025-07-27", - "last_updated": "2025-07-27", + "release_date": "2025-09-19", + "last_updated": "2025-09-19", "cost": { - "input": 0.12, - "output": 0.2 - }, - "type": "chat" - }, + "input": 0.2, + "output": 0.5, + "cache_read": 0.05 + } + } + ] + }, + "minimax-coding-plan": { + "id": "minimax-coding-plan", + "name": "MiniMax Coding Plan (minimax.io)", + "display_name": "MiniMax Coding Plan (minimax.io)", + "api": "https://api.minimax.io/anthropic/v1", + "doc": "https://platform.minimax.io/docs/coding-plan/intro", + "models": [ { - "id": "nvidia.nemotron-nano-12b-v2", - "name": "NVIDIA Nemotron Nano 12B v2 VL BF16", - "display_name": "NVIDIA Nemotron Nano 12B v2 VL BF16", + "id": "MiniMax-M2", + "name": "MiniMax-M2", + "display_name": "MiniMax-M2", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 196608, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "open_weights": true, + "release_date": "2025-10-27", + "last_updated": "2025-10-27", "cost": { - "input": 0.2, - "output": 0.6 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "google.gemma-3-12b-it", - "name": "Google Gemma 3 12B", - "display_name": "Google Gemma 3 12B", + "id": "MiniMax-M2.1", + "name": "MiniMax-M2.1", + "display_name": "MiniMax-M2.1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 204800, + "output": 131072 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2024-12", - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "open_weights": true, + "release_date": "2025-12-23", + "last_updated": "2025-12-23", "cost": { - "input": 0.049999999999999996, - "output": 0.09999999999999999 - }, - "type": "chat" - }, + "input": 0, + "output": 0 + } + } + ] + }, + "ovhcloud": { + "id": "ovhcloud", + "name": "OVHcloud AI Endpoints", + "display_name": "OVHcloud AI Endpoints", + "api": "https://oai.endpoints.kepler.ai.cloud.ovh.net/v1", + "doc": "https://www.ovhcloud.com/en/public-cloud/ai-endpoints/catalog//", + "models": [ { - "id": "ai21.jamba-1-5-large-v1:0", - "name": "Jamba 1.5 Large", - "display_name": "Jamba 1.5 Large", + "id": "mixtral-8x7b-instruct-v0.1", + "name": "Mixtral-8x7B-Instruct-v0.1", + "display_name": "Mixtral-8x7B-Instruct-v0.1", "modalities": { "input": [ "text" @@ -56561,29 +54623,27 @@ ] }, "limit": { - "context": 256000, - "output": 4096 + "context": 32768, + "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2024-08", - "release_date": "2024-08-15", - "last_updated": "2024-08-15", + "release_date": "2025-04-01", + "last_updated": "2025-04-01", "cost": { - "input": 2, - "output": 8 - }, - "type": "chat" + "input": 0.7, + "output": 0.7 + } }, { - "id": "meta.llama3-3-70b-instruct-v1:0", - "name": "Llama 3.3 70B Instruct", - "display_name": "Llama 3.3 70B Instruct", + "id": "mistral-7b-instruct-v0.3", + "name": "Mistral-7B-Instruct-v0.3", + "display_name": "Mistral-7B-Instruct-v0.3", "modalities": { "input": [ "text" @@ -56593,8 +54653,8 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 65536, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -56603,88 +54663,78 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2025-04-01", + "last_updated": "2025-04-01", "cost": { - "input": 0.72, - "output": 0.72 - }, - "type": "chat" + "input": 0.11, + "output": 0.11 + } }, { - "id": "anthropic.claude-3-opus-20240229-v1:0", - "name": "Claude Opus 3", - "display_name": "Claude Opus 3", + "id": "llama-3.1-8b-instruct", + "name": "Llama-3.1-8B-Instruct", + "display_name": "Llama-3.1-8B-Instruct", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 4096 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2023-08", - "release_date": "2024-02-29", - "last_updated": "2024-02-29", + "attachment": false, + "open_weights": true, + "release_date": "2025-06-11", + "last_updated": "2025-06-11", "cost": { - "input": 15, - "output": 75 - }, - "type": "chat" + "input": 0.11, + "output": 0.11 + } }, { - "id": "amazon.nova-pro-v1:0", - "name": "Nova Pro", - "display_name": "Nova Pro", + "id": "qwen2.5-vl-72b-instruct", + "name": "Qwen2.5-VL-72B-Instruct", + "display_name": "Qwen2.5-VL-72B-Instruct", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 300000, - "output": 8192 + "context": 32768, + "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-12-03", - "last_updated": "2024-12-03", + "open_weights": true, + "release_date": "2025-03-31", + "last_updated": "2025-03-31", "cost": { - "input": 0.8, - "output": 3.2, - "cache_read": 0.2 - }, - "type": "chat" + "input": 1.01, + "output": 1.01 + } }, { - "id": "meta.llama3-1-8b-instruct-v1:0", - "name": "Llama 3.1 8B Instruct", - "display_name": "Llama 3.1 8B Instruct", + "id": "mistral-nemo-instruct-2407", + "name": "Mistral-Nemo-Instruct-2407", + "display_name": "Mistral-Nemo-Instruct-2407", "modalities": { "input": [ "text" @@ -56694,8 +54744,8 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 65536, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -56704,50 +54754,48 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "release_date": "2024-11-20", + "last_updated": "2024-11-20", "cost": { - "input": 0.22, - "output": 0.22 - }, - "type": "chat" + "input": 0.14, + "output": 0.14 + } }, { - "id": "openai.gpt-oss-120b-1:0", - "name": "gpt-oss-120b", - "display_name": "gpt-oss-120b", + "id": "mistral-small-3.2-24b-instruct-2506", + "name": "Mistral-Small-3.2-24B-Instruct-2506", + "display_name": "Mistral-Small-3.2-24B-Instruct-2506", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "attachment": true, + "open_weights": true, + "release_date": "2025-07-16", + "last_updated": "2025-07-16", "cost": { - "input": 0.15, - "output": 0.6 - }, - "type": "chat" - }, - { - "id": "qwen.qwen3-32b-v1:0", - "name": "Qwen3 32B (dense)", - "display_name": "Qwen3 32B (dense)", + "input": 0.1, + "output": 0.31 + } + }, + { + "id": "qwen2.5-coder-32b-instruct", + "name": "Qwen2.5-Coder-32B-Instruct", + "display_name": "Qwen2.5-Coder-32B-Instruct", "modalities": { "input": [ "text" @@ -56757,79 +54805,68 @@ ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 32768, + "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2024-04", - "release_date": "2025-09-18", - "last_updated": "2025-09-18", + "release_date": "2025-03-24", + "last_updated": "2025-03-24", "cost": { - "input": 0.15, - "output": 0.6 - }, - "type": "chat" + "input": 0.96, + "output": 0.96 + } }, { - "id": "anthropic.claude-3-5-sonnet-20240620-v1:0", - "name": "Claude Sonnet 3.5", - "display_name": "Claude Sonnet 3.5", + "id": "qwen3-coder-30b-a3b-instruct", + "name": "Qwen3-Coder-30B-A3B-Instruct", + "display_name": "Qwen3-Coder-30B-A3B-Instruct", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 8192 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-06-20", - "last_updated": "2024-06-20", + "attachment": false, + "open_weights": true, + "release_date": "2025-10-28", + "last_updated": "2025-10-28", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 - }, - "type": "chat" + "input": 0.07, + "output": 0.26 + } }, { - "id": "anthropic.claude-haiku-4-5-20251001-v1:0", - "name": "Claude Haiku 4.5", - "display_name": "Claude Haiku 4.5", + "id": "deepseek-r1-distill-llama-70b", + "name": "DeepSeek-R1-Distill-Llama-70B", + "display_name": "DeepSeek-R1-Distill-Llama-70B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -56837,23 +54874,19 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-02-28", - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "attachment": false, + "open_weights": true, + "release_date": "2025-01-30", + "last_updated": "2025-01-30", "cost": { - "input": 1, - "output": 5, - "cache_read": 0.1, - "cache_write": 1.25 - }, - "type": "chat" + "input": 0.74, + "output": 0.74 + } }, { - "id": "cohere.command-r-v1:0", - "name": "Command R", - "display_name": "Command R", + "id": "gpt-oss-20b", + "name": "gpt-oss-20b", + "display_name": "gpt-oss-20b", "modalities": { "input": [ "text" @@ -56863,61 +54896,57 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 131072, + "output": 131072 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "knowledge": "2024-04", - "release_date": "2024-03-11", - "last_updated": "2024-03-11", + "release_date": "2025-08-28", + "last_updated": "2025-08-28", "cost": { - "input": 0.5, - "output": 1.5 - }, - "type": "chat" + "input": 0.05, + "output": 0.18 + } }, { - "id": "mistral.voxtral-small-24b-2507", - "name": "Voxtral Small 24B 2507", - "display_name": "Voxtral Small 24B 2507", + "id": "gpt-oss-120b", + "name": "gpt-oss-120b", + "display_name": "gpt-oss-120b", "modalities": { "input": [ - "text", - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 32000, - "output": 8192 + "context": 131072, + "output": 131072 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2025-07-01", - "last_updated": "2025-07-01", + "release_date": "2025-08-28", + "last_updated": "2025-08-28", "cost": { - "input": 0.15, - "output": 0.35 - }, - "type": "chat" + "input": 0.09, + "output": 0.47 + } }, { - "id": "amazon.nova-micro-v1:0", - "name": "Nova Micro", - "display_name": "Nova Micro", + "id": "meta-llama-3_3-70b-instruct", + "name": "Meta-Llama-3_3-70B-Instruct", + "display_name": "Meta-Llama-3_3-70B-Instruct", "modalities": { "input": [ "text" @@ -56927,8 +54956,8 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -56936,21 +54965,18 @@ "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-12-03", - "last_updated": "2024-12-03", + "open_weights": true, + "release_date": "2025-04-01", + "last_updated": "2025-04-01", "cost": { - "input": 0.035, - "output": 0.14, - "cache_read": 0.00875 - }, - "type": "chat" + "input": 0.74, + "output": 0.74 + } }, { - "id": "meta.llama3-1-70b-instruct-v1:0", - "name": "Llama 3.1 70B Instruct", - "display_name": "Llama 3.1 70B Instruct", + "id": "qwen3-32b", + "name": "Qwen3-32B", + "display_name": "Qwen3-32B", "modalities": { "input": [ "text" @@ -56960,64 +54986,72 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 32768, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "release_date": "2025-07-16", + "last_updated": "2025-07-16", "cost": { - "input": 0.72, - "output": 0.72 - }, - "type": "chat" - }, + "input": 0.09, + "output": 0.25 + } + } + ] + }, + "v0": { + "id": "v0", + "name": "v0", + "display_name": "v0", + "doc": "https://sdk.vercel.ai/providers/ai-sdk-providers/vercel", + "models": [ { - "id": "meta.llama3-70b-instruct-v1:0", - "name": "Llama 3 70B Instruct", - "display_name": "Llama 3 70B Instruct", + "id": "v0-1.5-lg", + "name": "v0-1.5-lg", + "display_name": "v0-1.5-lg", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 2048 + "context": 512000, + "output": 32000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "attachment": true, + "open_weights": false, + "release_date": "2025-06-09", + "last_updated": "2025-06-09", "cost": { - "input": 2.65, - "output": 3.5 - }, - "type": "chat" + "input": 15, + "output": 75 + } }, { - "id": "deepseek.r1-v1:0", - "name": "DeepSeek-R1", - "display_name": "DeepSeek-R1", + "id": "v0-1.5-md", + "name": "v0-1.5-md", + "display_name": "v0-1.5-md", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -57025,7 +55059,7 @@ }, "limit": { "context": 128000, - "output": 32768 + "output": 32000 }, "temperature": true, "tool_call": true, @@ -57033,57 +55067,91 @@ "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-07", - "release_date": "2025-01-20", - "last_updated": "2025-05-29", + "release_date": "2025-06-09", + "last_updated": "2025-06-09", "cost": { - "input": 1.35, - "output": 5.4 - }, - "type": "chat" + "input": 3, + "output": 15 + } }, { - "id": "anthropic.claude-3-5-sonnet-20241022-v2:0", - "name": "Claude Sonnet 3.5 v2", - "display_name": "Claude Sonnet 3.5 v2", + "id": "v0-1.0-md", + "name": "v0-1.0-md", + "display_name": "v0-1.0-md", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 8192 + "context": 128000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-10-22", - "last_updated": "2024-10-22", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "output": 15 + } + } + ] + }, + "iflowcn": { + "id": "iflowcn", + "name": "iFlow", + "display_name": "iFlow", + "api": "https://apis.iflow.cn/v1", + "doc": "https://platform.iflow.cn/en/docs", + "models": [ + { + "id": "deepseek-v3", + "name": "DeepSeek-V3", + "display_name": "DeepSeek-V3", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] }, - "type": "chat" + "limit": { + "context": 128000, + "output": 32000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2024-12-26", + "last_updated": "2024-12-26", + "cost": { + "input": 0, + "output": 0 + } }, { - "id": "mistral.ministral-3-8b-instruct", - "name": "Ministral 3 8B", - "display_name": "Ministral 3 8B", + "id": "kimi-k2", + "name": "Kimi-K2", + "display_name": "Kimi-K2", "modalities": { "input": [ "text" @@ -57094,7 +55162,7 @@ }, "limit": { "context": 128000, - "output": 4096 + "output": 64000 }, "temperature": true, "tool_call": true, @@ -57103,18 +55171,18 @@ }, "attachment": false, "open_weights": false, + "knowledge": "2024-10", "release_date": "2024-12-01", "last_updated": "2024-12-01", "cost": { - "input": 0.15, - "output": 0.15 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "cohere.command-text-v14", - "name": "Command", - "display_name": "Command", + "id": "deepseek-r1", + "name": "DeepSeek-R1", + "display_name": "DeepSeek-R1", "modalities": { "input": [ "text" @@ -57124,41 +55192,39 @@ ] }, "limit": { - "context": 4096, - "output": 4096 + "context": 128000, + "output": 32000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "knowledge": "2023-08", - "release_date": "2023-11-01", - "last_updated": "2023-11-01", + "knowledge": "2024-12", + "release_date": "2025-01-20", + "last_updated": "2025-01-20", "cost": { - "input": 1.5, - "output": 2 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "anthropic.claude-opus-4-20250514-v1:0", - "name": "Claude Opus 4", - "display_name": "Claude Opus 4", + "id": "qwen3-235b", + "name": "Qwen3-235B-A22B", + "display_name": "Qwen3-235B-A22B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, + "context": 128000, "output": 32000 }, "temperature": true, @@ -57167,26 +55233,22 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "attachment": false, + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2024-12-01", + "last_updated": "2024-12-01", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "mistral.voxtral-mini-3b-2507", - "name": "Voxtral Mini 3B 2507", - "display_name": "Voxtral Mini 3B 2507", + "id": "kimi-k2-0905", + "name": "Kimi-K2-0905", + "display_name": "Kimi-K2-0905", "modalities": { "input": [ - "audio", "text" ], "output": [ @@ -57194,8 +55256,8 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 256000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -57204,30 +55266,28 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "knowledge": "2024-12", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", "cost": { - "input": 0.04, - "output": 0.04 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "global.anthropic.claude-opus-4-5-20251101-v1:0", - "name": "Claude Opus 4.5 (Global)", - "display_name": "Claude Opus 4.5 (Global)", + "id": "qwen3-235b-a22b-thinking-2507", + "name": "Qwen3-235B-A22B-Thinking", + "display_name": "Qwen3-235B-A22B-Thinking", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, + "context": 256000, "output": 64000 }, "temperature": true, @@ -57236,56 +55296,52 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-11-24", - "last_updated": "2025-08-01", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-01", + "last_updated": "2025-07-01", "cost": { - "input": 5, - "output": 25, - "cache_read": 1.5, - "cache_write": 18.75 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "amazon.nova-2-lite-v1:0", - "name": "Nova 2 Lite", - "display_name": "Nova 2 Lite", + "id": "qwen3-vl-plus", + "name": "Qwen3-VL-Plus", + "display_name": "Qwen3-VL-Plus", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 256000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "knowledge": "2024-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.33, - "output": 2.75 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "qwen.qwen3-coder-480b-a35b-v1:0", - "name": "Qwen3 Coder 480B A35B Instruct", - "display_name": "Qwen3 Coder 480B A35B Instruct", + "id": "glm-4.6", + "name": "GLM-4.6", + "display_name": "GLM-4.6", "modalities": { "input": [ "text" @@ -57295,66 +55351,60 @@ ] }, "limit": { - "context": 131072, - "output": 65536 + "context": 200000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2024-04", - "release_date": "2025-09-18", - "last_updated": "2025-09-18", - "cost": { - "input": 0.22, - "output": 1.8 - }, - "type": "chat" + "open_weights": false, + "knowledge": "2024-10", + "release_date": "2024-12-01", + "last_updated": "2025-11-13", + "cost": { + "input": 0, + "output": 0 + } }, { - "id": "anthropic.claude-sonnet-4-5-20250929-v1:0", - "name": "Claude Sonnet 4.5", - "display_name": "Claude Sonnet 4.5", + "id": "qwen3-235b-a22b-instruct", + "name": "Qwen3-235B-A22B-Instruct", + "display_name": "Qwen3-235B-A22B-Instruct", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, + "context": 256000, "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-01", + "last_updated": "2025-07-01", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "openai.gpt-oss-safeguard-20b", - "name": "GPT OSS Safeguard 20B", - "display_name": "GPT OSS Safeguard 20B", + "id": "qwen3-max", + "name": "Qwen3-Max", + "display_name": "Qwen3-Max", "modalities": { "input": [ "text" @@ -57364,8 +55414,8 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 256000, + "output": 32000 }, "temperature": true, "tool_call": true, @@ -57374,18 +55424,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "knowledge": "2024-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.07, - "output": 0.2 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "openai.gpt-oss-20b-1:0", - "name": "gpt-oss-20b", - "display_name": "gpt-oss-20b", + "id": "deepseek-v3.2", + "name": "DeepSeek-V3.2-Exp", + "display_name": "DeepSeek-V3.2-Exp", "modalities": { "input": [ "text" @@ -57396,7 +55446,7 @@ }, "limit": { "context": 128000, - "output": 4096 + "output": 64000 }, "temperature": true, "tool_call": true, @@ -57404,19 +55454,19 @@ "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.07, - "output": 0.3 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "meta.llama3-2-3b-instruct-v1:0", - "name": "Llama 3.2 3B Instruct", - "display_name": "Llama 3.2 3B Instruct", + "id": "qwen3-max-preview", + "name": "Qwen3-Max-Preview", + "display_name": "Qwen3-Max-Preview", "modalities": { "input": [ "text" @@ -57426,8 +55476,8 @@ ] }, "limit": { - "context": 131000, - "output": 4096 + "context": 256000, + "output": 32000 }, "temperature": true, "tool_call": true, @@ -57435,20 +55485,19 @@ "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-09-25", - "last_updated": "2024-09-25", + "open_weights": false, + "knowledge": "2024-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.15, - "output": 0.15 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "anthropic.claude-instant-v1", - "name": "Claude Instant", - "display_name": "Claude Instant", + "id": "qwen3-coder-plus", + "name": "Qwen3-Coder-Plus", + "display_name": "Qwen3-Coder-Plus", "modalities": { "input": [ "text" @@ -57458,64 +55507,68 @@ ] }, "limit": { - "context": 100000, - "output": 4096 + "context": 256000, + "output": 64000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2023-08", - "release_date": "2023-03-01", - "last_updated": "2023-03-01", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-01", + "last_updated": "2025-07-01", "cost": { - "input": 0.8, - "output": 2.4 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "amazon.nova-premier-v1:0", - "name": "Nova Premier", - "display_name": "Nova Premier", + "id": "qwen3-32b", + "name": "Qwen3-32B", + "display_name": "Qwen3-32B", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 16384 + "context": 128000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, + "attachment": false, + "open_weights": true, "knowledge": "2024-10", - "release_date": "2024-12-03", - "last_updated": "2024-12-03", + "release_date": "2024-12-01", + "last_updated": "2024-12-01", "cost": { - "input": 2.5, - "output": 12.5 - }, - "type": "chat" - }, + "input": 0, + "output": 0 + } + } + ] + }, + "synthetic": { + "id": "synthetic", + "name": "Synthetic", + "display_name": "Synthetic", + "api": "https://api.synthetic.new/v1", + "doc": "https://synthetic.new/pricing", + "models": [ { - "id": "mistral.mistral-7b-instruct-v0:2", - "name": "Mistral-7B-Instruct-v0.3", - "display_name": "Mistral-7B-Instruct-v0.3", + "id": "hf:Qwen/Qwen3-235B-A22B-Instruct-2507", + "name": "Qwen 3 235B Instruct", + "display_name": "Qwen 3 235B Instruct", "modalities": { "input": [ "text" @@ -57525,8 +55578,8 @@ ] }, "limit": { - "context": 127000, - "output": 127000 + "context": 256000, + "output": 32000 }, "temperature": true, "tool_call": true, @@ -57535,18 +55588,18 @@ }, "attachment": false, "open_weights": true, - "release_date": "2025-04-01", - "last_updated": "2025-04-01", + "knowledge": "2025-04", + "release_date": "2025-04-28", + "last_updated": "2025-07-21", "cost": { - "input": 0.11, - "output": 0.11 - }, - "type": "chat" + "input": 0.2, + "output": 0.6 + } }, { - "id": "mistral.mixtral-8x7b-instruct-v0:1", - "name": "Mixtral-8x7B-Instruct-v0.1", - "display_name": "Mixtral-8x7B-Instruct-v0.1", + "id": "hf:Qwen/Qwen2.5-Coder-32B-Instruct", + "name": "Qwen2.5-Coder-32B-Instruct", + "display_name": "Qwen2.5-Coder-32B-Instruct", "modalities": { "input": [ "text" @@ -57556,8 +55609,8 @@ ] }, "limit": { - "context": 32000, - "output": 32000 + "context": 32768, + "output": 32768 }, "temperature": true, "tool_call": false, @@ -57566,88 +55619,81 @@ }, "attachment": false, "open_weights": true, - "release_date": "2025-04-01", - "last_updated": "2025-04-01", + "knowledge": "2024-10", + "release_date": "2024-11-11", + "last_updated": "2024-11-11", "cost": { - "input": 0.7, - "output": 0.7 - }, - "type": "chat" + "input": 0.8, + "output": 0.8 + } }, { - "id": "anthropic.claude-opus-4-1-20250805-v1:0", - "name": "Claude Opus 4.1", - "display_name": "Claude Opus 4.1", + "id": "hf:Qwen/Qwen3-Coder-480B-A35B-Instruct", + "name": "Qwen 3 Coder 480B", + "display_name": "Qwen 3 Coder 480B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, + "context": 256000, "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 - }, - "type": "chat" + "input": 2, + "output": 2 + } }, { - "id": "meta.llama4-scout-17b-instruct-v1:0", - "name": "Llama 4 Scout 17B Instruct", - "display_name": "Llama 4 Scout 17B Instruct", + "id": "hf:Qwen/Qwen3-235B-A22B-Thinking-2507", + "name": "Qwen3 235B A22B Thinking 2507", + "display_name": "Qwen3 235B A22B Thinking 2507", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 3500000, - "output": 16384 + "context": 256000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "knowledge": "2025-04", + "release_date": "2025-07-25", + "last_updated": "2025-07-25", "cost": { - "input": 0.17, - "output": 0.66 - }, - "type": "chat" + "input": 0.65, + "output": 3 + } }, { - "id": "ai21.jamba-1-5-mini-v1:0", - "name": "Jamba 1.5 Mini", - "display_name": "Jamba 1.5 Mini", + "id": "hf:MiniMaxAI/MiniMax-M2", + "name": "MiniMax-M2", + "display_name": "MiniMax-M2", "modalities": { "input": [ "text" @@ -57657,29 +55703,28 @@ ] }, "limit": { - "context": 256000, - "output": 4096 + "context": 196608, + "output": 131000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "knowledge": "2024-08", - "release_date": "2024-08-15", - "last_updated": "2024-08-15", + "release_date": "2025-10-27", + "last_updated": "2025-10-27", "cost": { - "input": 0.2, - "output": 0.4 - }, - "type": "chat" + "input": 0.55, + "output": 2.19 + } }, { - "id": "meta.llama3-8b-instruct-v1:0", - "name": "Llama 3 8B Instruct", - "display_name": "Llama 3 8B Instruct", + "id": "hf:MiniMaxAI/MiniMax-M2.1", + "name": "MiniMax-M2.1", + "display_name": "MiniMax-M2.1", "modalities": { "input": [ "text" @@ -57689,29 +55734,28 @@ ] }, "limit": { - "context": 8192, - "output": 2048 + "context": 204800, + "output": 131072 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "knowledge": "2023-03", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "release_date": "2025-12-23", + "last_updated": "2025-12-23", "cost": { - "input": 0.3, - "output": 0.6 - }, - "type": "chat" + "input": 0.55, + "output": 2.19 + } }, { - "id": "amazon.titan-text-express-v1:0:8k", - "name": "Titan Text G1 - Express", - "display_name": "Titan Text G1 - Express", + "id": "hf:meta-llama/Llama-3.1-70B-Instruct", + "name": "Llama-3.1-70B-Instruct", + "display_name": "Llama-3.1-70B-Instruct", "modalities": { "input": [ "text" @@ -57722,61 +55766,60 @@ }, "limit": { "context": 128000, - "output": 4096 + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 0.2, - "output": 0.6 - }, - "type": "chat" + "input": 0.9, + "output": 0.9 + } }, { - "id": "anthropic.claude-3-sonnet-20240229-v1:0", - "name": "Claude Sonnet 3", - "display_name": "Claude Sonnet 3", + "id": "hf:meta-llama/Llama-3.1-8B-Instruct", + "name": "Llama-3.1-8B-Instruct", + "display_name": "Llama-3.1-8B-Instruct", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 4096 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2023-08", - "release_date": "2024-03-04", - "last_updated": "2024-03-04", + "attachment": false, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 3, - "output": 15 - }, - "type": "chat" + "input": 0.2, + "output": 0.2 + } }, { - "id": "nvidia.nemotron-nano-9b-v2", - "name": "NVIDIA Nemotron Nano 9B v2", - "display_name": "NVIDIA Nemotron Nano 9B v2", + "id": "hf:meta-llama/Llama-3.3-70B-Instruct", + "name": "Llama-3.3-70B-Instruct", + "display_name": "Llama-3.3-70B-Instruct", "modalities": { "input": [ "text" @@ -57787,37 +55830,39 @@ }, "limit": { "context": 128000, - "output": 4096 + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 0.06, - "output": 0.23 - }, - "type": "chat" + "input": 0.9, + "output": 0.9 + } }, { - "id": "amazon.titan-text-express-v1", - "name": "Titan Text G1 - Express", - "display_name": "Titan Text G1 - Express", + "id": "hf:meta-llama/Llama-4-Scout-17B-16E-Instruct", + "name": "Llama-4-Scout-17B-16E-Instruct", + "display_name": "Llama-4-Scout-17B-16E-Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 328000, "output": 4096 }, "temperature": true, @@ -57825,20 +55870,20 @@ "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "attachment": true, + "open_weights": true, + "knowledge": "2024-08", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", "cost": { - "input": 0.2, + "input": 0.15, "output": 0.6 - }, - "type": "chat" + } }, { - "id": "meta.llama4-maverick-17b-instruct-v1:0", - "name": "Llama 4 Maverick 17B Instruct", - "display_name": "Llama 4 Maverick 17B Instruct", + "id": "hf:meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8", + "name": "Llama-4-Maverick-17B-128E-Instruct-FP8", + "display_name": "Llama-4-Maverick-17B-128E-Instruct-FP8", "modalities": { "input": [ "text", @@ -57849,8 +55894,8 @@ ] }, "limit": { - "context": 1000000, - "output": 16384 + "context": 524000, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -57863,15 +55908,14 @@ "release_date": "2025-04-05", "last_updated": "2025-04-05", "cost": { - "input": 0.24, - "output": 0.97 - }, - "type": "chat" + "input": 0.22, + "output": 0.88 + } }, { - "id": "mistral.ministral-3-14b-instruct", - "name": "Ministral 14B 3.0", - "display_name": "Ministral 14B 3.0", + "id": "hf:meta-llama/Llama-3.1-405B-Instruct", + "name": "Llama-3.1-405B-Instruct", + "display_name": "Llama-3.1-405B-Instruct", "modalities": { "input": [ "text" @@ -57882,58 +55926,61 @@ }, "limit": { "context": 128000, - "output": 4096 + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 0.2, - "output": 0.2 - }, - "type": "chat" + "input": 3, + "output": 3 + } }, { - "id": "openai.gpt-oss-safeguard-120b", - "name": "GPT OSS Safeguard 120B", - "display_name": "GPT OSS Safeguard 120B", + "id": "hf:moonshotai/Kimi-K2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-01", + "last_updated": "2026-01", "cost": { - "input": 0.15, - "output": 0.6 - }, - "type": "chat" + "input": 0.55, + "output": 2.19 + } }, { - "id": "qwen.qwen3-235b-a22b-2507-v1:0", - "name": "Qwen3 235B A22B 2507", - "display_name": "Qwen3 235B A22B 2507", + "id": "hf:moonshotai/Kimi-K2-Instruct-0905", + "name": "Kimi K2 0905", + "display_name": "Kimi K2 0905", "modalities": { "input": [ "text" @@ -57944,7 +55991,7 @@ }, "limit": { "context": 262144, - "output": 131072 + "output": 32768 }, "temperature": true, "tool_call": true, @@ -57953,59 +56000,85 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-04", - "release_date": "2025-09-18", - "last_updated": "2025-09-18", + "knowledge": "2024-10", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", "cost": { - "input": 0.22, - "output": 0.88 - }, - "type": "chat" + "input": 1.2, + "output": 1.2 + } }, { - "id": "amazon.nova-lite-v1:0", - "name": "Nova Lite", - "display_name": "Nova Lite", + "id": "hf:moonshotai/Kimi-K2-Thinking", + "name": "Kimi K2 Thinking", + "display_name": "Kimi K2 Thinking", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 300000, - "output": 8192 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-12-03", - "last_updated": "2024-12-03", + "attachment": false, + "open_weights": true, + "knowledge": "2025-11", + "release_date": "2025-11-07", + "last_updated": "2025-11-07", "cost": { - "input": 0.06, - "output": 0.24, - "cache_read": 0.015 + "input": 0.55, + "output": 2.19 + } + }, + { + "id": "hf:zai-org/GLM-4.5", + "name": "GLM 4.5", + "display_name": "GLM 4.5", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] }, - "type": "chat" + "limit": { + "context": 128000, + "output": 96000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", + "cost": { + "input": 0.55, + "output": 2.19 + } }, { - "id": "anthropic.claude-3-5-haiku-20241022-v1:0", - "name": "Claude Haiku 3.5", - "display_name": "Claude Haiku 3.5", + "id": "hf:zai-org/GLM-4.7", + "name": "GLM 4.7", + "display_name": "GLM 4.7", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" @@ -58013,30 +56086,28 @@ }, "limit": { "context": 200000, - "output": 8192 + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-07", - "release_date": "2024-10-22", - "last_updated": "2024-10-22", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "cost": { - "input": 0.8, - "output": 4, - "cache_read": 0.08, - "cache_write": 1 - }, - "type": "chat" + "input": 0.55, + "output": 2.19 + } }, { - "id": "moonshot.kimi-k2-thinking", - "name": "Kimi K2 Thinking", - "display_name": "Kimi K2 Thinking", + "id": "hf:zai-org/GLM-4.6", + "name": "GLM 4.6", + "display_name": "GLM 4.6", "modalities": { "input": [ "text" @@ -58046,8 +56117,8 @@ ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -58057,157 +56128,145 @@ }, "attachment": false, "open_weights": true, - "release_date": "2025-12-02", - "last_updated": "2025-12-02", + "knowledge": "2025-04", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", "cost": { - "input": 0.6, - "output": 2.5 - }, - "type": "chat" - } - ] - }, - "poe": { - "id": "poe", - "name": "Poe", - "display_name": "Poe", - "api": "https://api.poe.com/v1", - "doc": "https://creator.poe.com/docs/external-applications/openai-compatible-api", - "models": [ + "input": 0.55, + "output": 2.19 + } + }, { - "id": "xai/grok-4-fast-non-reasoning", - "name": "Grok-4-Fast-Non-Reasoning", - "display_name": "Grok-4-Fast-Non-Reasoning", + "id": "hf:deepseek-ai/DeepSeek-R1", + "name": "DeepSeek R1", + "display_name": "DeepSeek R1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 2000000, + "context": 128000, "output": 128000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-09-16", - "last_updated": "2025-09-16", + "attachment": false, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2025-01-20", + "last_updated": "2025-01-20", "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 - }, - "type": "chat" + "input": 0.55, + "output": 2.19 + } }, { - "id": "xai/grok-4-fast-reasoning", - "name": "Grok 4 Fast Reasoning", - "display_name": "Grok 4 Fast Reasoning", + "id": "hf:deepseek-ai/DeepSeek-R1-0528", + "name": "DeepSeek R1 (0528)", + "display_name": "DeepSeek R1 (0528)", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 2000000, + "context": 128000, "output": 128000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-09-16", - "last_updated": "2025-09-16", + "release_date": "2025-08-01", + "last_updated": "2025-08-01", "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 - }, - "type": "chat" + "input": 3, + "output": 8 + } }, { - "id": "xai/grok-4.1-fast-reasoning", - "name": "Grok-4.1-Fast-Reasoning", - "display_name": "Grok-4.1-Fast-Reasoning", + "id": "hf:deepseek-ai/DeepSeek-V3.1-Terminus", + "name": "DeepSeek V3.1 Terminus", + "display_name": "DeepSeek V3.1 Terminus", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 128000, + "output": 128000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-11-19", - "last_updated": "2025-11-19", - "type": "chat" + "release_date": "2025-09-22", + "last_updated": "2025-09-25", + "cost": { + "input": 1.2, + "output": 1.2 + } }, { - "id": "xai/grok-4", - "name": "Grok 4", - "display_name": "Grok 4", + "id": "hf:deepseek-ai/DeepSeek-V3.2", + "name": "DeepSeek V3.2", + "display_name": "DeepSeek V3.2", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 128000 + "context": 162816, + "output": 8000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-07-10", - "last_updated": "2025-07-10", + "attachment": false, + "open_weights": true, + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.75 - }, - "type": "chat" + "input": 0.27, + "output": 0.4, + "cache_read": 0.27, + "cache_write": 0 + } }, { - "id": "xai/grok-code-fast-1", - "name": "Grok Code Fast 1", - "display_name": "Grok Code Fast 1", + "id": "hf:deepseek-ai/DeepSeek-V3", + "name": "DeepSeek V3", + "display_name": "DeepSeek V3", "modalities": { "input": [ "text" @@ -58217,58 +56276,60 @@ ] }, "limit": { - "context": 256000, + "context": 128000, "output": 128000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-08-22", - "last_updated": "2025-08-22", + "attachment": false, + "open_weights": true, + "knowledge": "2024-07", + "release_date": "2025-01-20", + "last_updated": "2025-05-29", "cost": { - "input": 0.2, - "output": 1.5, - "cache_read": 0.02 - }, - "type": "chat" + "input": 1.25, + "output": 1.25 + } }, { - "id": "xai/grok-4.1-fast-non-reasoning", - "name": "Grok-4.1-Fast-Non-Reasoning", - "display_name": "Grok-4.1-Fast-Non-Reasoning", + "id": "hf:deepseek-ai/DeepSeek-V3.1", + "name": "DeepSeek V3.1", + "display_name": "DeepSeek V3.1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 128000, + "output": 128000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-11-19", - "last_updated": "2025-11-19", - "type": "chat" + "release_date": "2025-08-21", + "last_updated": "2025-08-21", + "cost": { + "input": 0.56, + "output": 1.68 + } }, { - "id": "xai/grok-3", - "name": "Grok 3", - "display_name": "Grok 3", + "id": "hf:deepseek-ai/DeepSeek-V3-0324", + "name": "DeepSeek V3 (0324)", + "display_name": "DeepSeek V3 (0324)", "modalities": { "input": [ "text" @@ -58278,29 +56339,27 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 128000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-04-11", - "last_updated": "2025-04-11", + "release_date": "2025-08-01", + "last_updated": "2025-08-01", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.75 - }, - "type": "chat" + "input": 1.2, + "output": 1.2 + } }, { - "id": "xai/grok-3-mini", - "name": "Grok 3 Mini", - "display_name": "Grok 3 Mini", + "id": "hf:openai/gpt-oss-120b", + "name": "GPT OSS 120B", + "display_name": "GPT OSS 120B", "modalities": { "input": [ "text" @@ -58310,196 +56369,194 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-04-11", - "last_updated": "2025-04-11", + "attachment": false, + "open_weights": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.3, - "output": 0.5, - "cache_read": 0.075 - }, - "type": "chat" - }, + "input": 0.1, + "output": 0.1 + } + } + ] + }, + "deepinfra": { + "id": "deepinfra", + "name": "Deep Infra", + "display_name": "Deep Infra", + "doc": "https://deepinfra.com/models", + "models": [ { - "id": "ideogramai/ideogram", - "name": "Ideogram", - "display_name": "Ideogram", + "id": "moonshotai/Kimi-K2-Instruct", + "name": "Kimi K2", + "display_name": "Kimi K2", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 150, - "output": 8192 + "context": 131072, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2024-04-03", - "last_updated": "2024-04-03", - "type": "chat" + "attachment": false, + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2025-07-11", + "last_updated": "2025-07-11", + "cost": { + "input": 0.5, + "output": 2 + } }, { - "id": "ideogramai/ideogram-v2a", - "name": "Ideogram-v2a", - "display_name": "Ideogram-v2a", + "id": "moonshotai/Kimi-K2-Thinking", + "name": "Kimi K2 Thinking", + "display_name": "Kimi K2 Thinking", "modalities": { "input": [ "text" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 150, - "output": 8192 + "context": 131072, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-02-27", - "last_updated": "2025-02-27", - "type": "chat" + "attachment": false, + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2025-11-06", + "last_updated": "2025-11-07", + "cost": { + "input": 0.47, + "output": 2 + } }, { - "id": "ideogramai/ideogram-v2a-turbo", - "name": "Ideogram-v2a-Turbo", - "display_name": "Ideogram-v2a-Turbo", + "id": "MiniMaxAI/MiniMax-M2", + "name": "MiniMax M2", + "display_name": "MiniMax M2", "modalities": { "input": [ "text" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 150, - "output": 8192 + "context": 262144, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-02-27", - "last_updated": "2025-02-27", - "type": "chat" + "attachment": false, + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", + "cost": { + "input": 0.254, + "output": 1.02 + } }, { - "id": "ideogramai/ideogram-v2", - "name": "Ideogram-v2", - "display_name": "Ideogram-v2", + "id": "MiniMaxAI/MiniMax-M2.1", + "name": "MiniMax M2.1", + "display_name": "MiniMax M2.1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 150, - "output": 8192 + "context": 196608, + "output": 196608 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2024-08-21", - "last_updated": "2024-08-21", - "type": "chat" - }, - { - "id": "runwayml/runway", - "name": "Runway", - "display_name": "Runway", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "video" - ] - }, - "limit": { - "context": 256, - "output": 8192 - }, - "temperature": false, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": false, - "release_date": "2024-10-11", - "last_updated": "2024-10-11", - "type": "chat" + "attachment": false, + "open_weights": true, + "knowledge": "2025-06", + "release_date": "2025-12-23", + "last_updated": "2025-12-23", + "cost": { + "input": 0.28, + "output": 1.2 + } }, { - "id": "runwayml/runway-gen-4-turbo", - "name": "Runway-Gen-4-Turbo", - "display_name": "Runway-Gen-4-Turbo", + "id": "openai/gpt-oss-20b", + "name": "GPT OSS 20B", + "display_name": "GPT OSS 20B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "video" + "text" ] }, "limit": { - "context": 256, - "output": 8192 + "context": 131072, + "output": 16384 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-05-09", - "last_updated": "2025-05-09", - "type": "chat" + "attachment": false, + "open_weights": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "cost": { + "input": 0.03, + "output": 0.14 + } }, { - "id": "poetools/claude-code", - "name": "claude-code", - "display_name": "claude-code", + "id": "openai/gpt-oss-120b", + "name": "GPT OSS 120B", + "display_name": "GPT OSS 120B", "modalities": { "input": [ "text" @@ -58509,788 +56566,857 @@ ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 131072, + "output": 16384 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-11-27", - "last_updated": "2025-11-27", - "type": "chat" + "attachment": false, + "open_weights": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "cost": { + "input": 0.05, + "output": 0.24 + } }, { - "id": "elevenlabs/elevenlabs-v3", - "name": "ElevenLabs-v3", - "display_name": "ElevenLabs-v3", + "id": "Qwen/Qwen3-Coder-480B-A35B-Instruct", + "name": "Qwen3 Coder 480B A35B Instruct", + "display_name": "Qwen3 Coder 480B A35B Instruct", "modalities": { "input": [ "text" ], "output": [ - "audio" + "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 262144, + "output": 66536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-06-05", - "last_updated": "2025-06-05", - "type": "chat" + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", + "cost": { + "input": 0.4, + "output": 1.6 + } }, { - "id": "elevenlabs/elevenlabs-music", - "name": "ElevenLabs-Music", - "display_name": "ElevenLabs-Music", + "id": "Qwen/Qwen3-Coder-480B-A35B-Instruct-Turbo", + "name": "Qwen3 Coder 480B A35B Instruct Turbo", + "display_name": "Qwen3 Coder 480B A35B Instruct Turbo", "modalities": { "input": [ "text" ], "output": [ - "audio" + "text" ] }, "limit": { - "context": 2000, - "output": 8192 + "context": 262144, + "output": 66536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-08-29", - "last_updated": "2025-08-29", - "type": "chat" + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", + "cost": { + "input": 0.3, + "output": 1.2 + } }, { - "id": "elevenlabs/elevenlabs-v2.5-turbo", - "name": "ElevenLabs-v2.5-Turbo", - "display_name": "ElevenLabs-v2.5-Turbo", + "id": "zai-org/GLM-4.5", + "name": "GLM-4.5", + "display_name": "GLM-4.5", "modalities": { "input": [ "text" ], "output": [ - "audio" + "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 131072, + "output": 98304 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2024-10-28", - "last_updated": "2024-10-28", - "type": "chat" + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", + "cost": { + "input": 0.6, + "output": 2.2 + } }, { - "id": "google/gemini-deep-research", - "name": "gemini-deep-research", - "display_name": "gemini-deep-research", + "id": "zai-org/GLM-4.7", + "name": "GLM-4.7", + "display_name": "GLM-4.7", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 8192 + "context": 202752, + "output": 16384 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "cost": { - "input": 1.6, - "output": 9.6 - }, - "type": "chat" + "input": 0.43, + "output": 1.75, + "cache_read": 0.08 + } }, { - "id": "google/nano-banana", - "name": "Nano-Banana", - "display_name": "Nano-Banana", + "id": "zai-org/GLM-4.7-Flash", + "name": "GLM-4.7-Flash", + "display_name": "GLM-4.7-Flash", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "text", - "image" + "text" ] }, "limit": { - "context": 32768, - "output": 8192 + "context": 202752, + "output": 16384 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-08-21", - "last_updated": "2025-08-21", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2026-01-19", + "last_updated": "2026-01-19", "cost": { - "input": 0.21, - "output": 1.8, - "cache_read": 0.021 - }, - "type": "chat" - }, + "input": 0.06, + "output": 0.4 + } + } + ] + }, + "zhipuai": { + "id": "zhipuai", + "name": "Zhipu AI", + "display_name": "Zhipu AI", + "api": "https://open.bigmodel.cn/api/paas/v4", + "doc": "https://docs.z.ai/guides/overview/pricing", + "models": [ { - "id": "google/imagen-4", - "name": "Imagen-4", - "display_name": "Imagen-4", + "id": "glm-4.6v", + "name": "GLM-4.6V", + "display_name": "GLM-4.6V", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 480, - "output": 8192 + "context": 128000, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, - "open_weights": false, - "release_date": "2025-05-22", - "last_updated": "2025-05-22", - "type": "chat" + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-12-08", + "last_updated": "2025-12-08", + "cost": { + "input": 0.3, + "output": 0.9 + } }, { - "id": "google/imagen-3", - "name": "Imagen-3", - "display_name": "Imagen-3", + "id": "glm-4.6", + "name": "GLM-4.6", + "display_name": "GLM-4.6", "modalities": { "input": [ "text" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 480, - "output": 8192 + "context": 204800, + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2024-10-15", - "last_updated": "2024-10-15", - "type": "chat" + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", + "cost": { + "input": 0.6, + "output": 2.2, + "cache_read": 0.11, + "cache_write": 0 + } }, { - "id": "google/imagen-4-ultra", - "name": "Imagen-4-Ultra", - "display_name": "Imagen-4-Ultra", + "id": "glm-4.5v", + "name": "GLM-4.5V", + "display_name": "GLM-4.5V", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 480, - "output": 8192 + "context": 64000, + "output": 16384 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, - "open_weights": false, - "release_date": "2025-05-24", - "last_updated": "2025-05-24", - "type": "chat" + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-08-11", + "last_updated": "2025-08-11", + "cost": { + "input": 0.6, + "output": 1.8 + } }, { - "id": "google/gemini-2.5-flash", - "name": "Gemini 2.5 Flash", - "display_name": "Gemini 2.5 Flash", + "id": "glm-4.5-air", + "name": "GLM-4.5-Air", + "display_name": "GLM-4.5-Air", "modalities": { "input": [ - "text", - "image", - "video", - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1065535, - "output": 65535 + "context": 131072, + "output": 98304 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-04-26", - "last_updated": "2025-04-26", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 0.21, - "output": 1.8, - "cache_read": 0.021 - }, - "type": "chat" + "input": 0.2, + "output": 1.1, + "cache_read": 0.03, + "cache_write": 0 + } }, { - "id": "google/gemini-2.0-flash-lite", - "name": "Gemini-2.0-Flash-Lite", - "display_name": "Gemini-2.0-Flash-Lite", + "id": "glm-4.7-flash", + "name": "GLM-4.7-Flash", + "display_name": "GLM-4.7-Flash", "modalities": { "input": [ - "text", - "image", - "video", - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 990000, - "output": 8192 + "context": 200000, + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-02-05", - "last_updated": "2025-02-05", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2026-01-19", + "last_updated": "2026-01-19", "cost": { - "input": 0.052, - "output": 0.21 - }, - "type": "chat" + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 + } }, { - "id": "google/gemini-3-pro", - "name": "Gemini-3-Pro", - "display_name": "Gemini-3-Pro", + "id": "glm-4.5", + "name": "GLM-4.5", + "display_name": "GLM-4.5", "modalities": { "input": [ - "text", - "image", - "video", - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 64000 + "context": 131072, + "output": 98304 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-10-22", - "last_updated": "2025-10-22", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 1.6, - "output": 9.6, - "cache_read": 0.16 - }, - "type": "chat" + "input": 0.6, + "output": 2.2, + "cache_read": 0.11, + "cache_write": 0 + } }, { - "id": "google/veo-3.1", - "name": "Veo-3.1", - "display_name": "Veo-3.1", + "id": "glm-4.5-flash", + "name": "GLM-4.5-Flash", + "display_name": "GLM-4.5-Flash", "modalities": { "input": [ "text" ], "output": [ - "video" + "text" ] }, "limit": { - "context": 480, - "output": 8192 + "context": 131072, + "output": 98304 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-10-15", - "last_updated": "2025-10-15", - "type": "chat" + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", + "cost": { + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 + } }, { - "id": "google/imagen-3-fast", - "name": "Imagen-3-Fast", - "display_name": "Imagen-3-Fast", + "id": "glm-4.7", + "name": "GLM-4.7", + "display_name": "GLM-4.7", "modalities": { "input": [ "text" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 480, - "output": 8192 + "context": 204800, + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2024-10-17", - "last_updated": "2024-10-17", - "type": "chat" - }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", + "cost": { + "input": 0.6, + "output": 2.2, + "cache_read": 0.11, + "cache_write": 0 + } + } + ] + }, + "submodel": { + "id": "submodel", + "name": "submodel", + "display_name": "submodel", + "api": "https://llm.submodel.ai/v1", + "doc": "https://submodel.gitbook.io", + "models": [ { - "id": "google/lyria", - "name": "Lyria", - "display_name": "Lyria", + "id": "openai/gpt-oss-120b", + "name": "GPT OSS 120B", + "display_name": "GPT OSS 120B", "modalities": { "input": [ "text" ], "output": [ - "audio" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 131072, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-06-04", - "last_updated": "2025-06-04", - "type": "chat" + "attachment": false, + "open_weights": true, + "release_date": "2025-08-23", + "last_updated": "2025-08-23", + "cost": { + "input": 0.1, + "output": 0.5 + } }, { - "id": "google/gemini-2.0-flash", - "name": "Gemini-2.0-Flash", - "display_name": "Gemini-2.0-Flash", + "id": "Qwen/Qwen3-235B-A22B-Instruct-2507", + "name": "Qwen3 235B A22B Instruct 2507", + "display_name": "Qwen3 235B A22B Instruct 2507", "modalities": { "input": [ - "text", - "image", - "video", - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 990000, - "output": 8192 + "context": 262144, + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "attachment": false, + "open_weights": true, + "release_date": "2025-08-23", + "last_updated": "2025-08-23", "cost": { - "input": 0.1, - "output": 0.42 - }, - "type": "chat" + "input": 0.2, + "output": 0.3 + } }, { - "id": "google/gemini-2.5-flash-lite", - "name": "Gemini 2.5 Flash Lite", - "display_name": "Gemini 2.5 Flash Lite", + "id": "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8", + "name": "Qwen3 Coder 480B A35B Instruct", + "display_name": "Qwen3 Coder 480B A35B Instruct", "modalities": { "input": [ - "text", - "image", - "video", - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1024000, - "output": 64000 + "context": 262144, + "output": 262144 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-06-19", - "last_updated": "2025-06-19", + "release_date": "2025-08-23", + "last_updated": "2025-08-23", "cost": { - "input": 0.07, - "output": 0.28 - }, - "type": "chat" + "input": 0.2, + "output": 0.8 + } }, { - "id": "google/veo-3", - "name": "Veo-3", - "display_name": "Veo-3", + "id": "Qwen/Qwen3-235B-A22B-Thinking-2507", + "name": "Qwen3 235B A22B Thinking 2507", + "display_name": "Qwen3 235B A22B Thinking 2507", "modalities": { "input": [ "text" ], "output": [ - "video" + "text" ] }, "limit": { - "context": 480, - "output": 8192 + "context": 262144, + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-05-21", - "last_updated": "2025-05-21", - "type": "chat" + "attachment": false, + "open_weights": true, + "release_date": "2025-08-23", + "last_updated": "2025-08-23", + "cost": { + "input": 0.2, + "output": 0.6 + } }, { - "id": "google/veo-3-fast", - "name": "Veo-3-Fast", - "display_name": "Veo-3-Fast", + "id": "zai-org/GLM-4.5-FP8", + "name": "GLM 4.5 FP8", + "display_name": "GLM 4.5 FP8", "modalities": { "input": [ "text" ], "output": [ - "video" + "text" ] }, "limit": { - "context": 480, - "output": 8192 + "context": 131072, + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-10-13", - "last_updated": "2025-10-13", - "type": "chat" + "attachment": false, + "open_weights": true, + "release_date": "2025-07-28", + "last_updated": "2025-07-28", + "cost": { + "input": 0.2, + "output": 0.8 + } }, { - "id": "google/imagen-4-fast", - "name": "Imagen-4-Fast", - "display_name": "Imagen-4-Fast", + "id": "zai-org/GLM-4.5-Air", + "name": "GLM 4.5 Air", + "display_name": "GLM 4.5 Air", "modalities": { "input": [ "text" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 480, - "output": 8192 + "context": 131072, + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-06-25", - "last_updated": "2025-06-25", - "type": "chat" + "attachment": false, + "open_weights": true, + "release_date": "2025-07-28", + "last_updated": "2025-07-28", + "cost": { + "input": 0.1, + "output": 0.5 + } }, { - "id": "google/veo-2", - "name": "Veo-2", - "display_name": "Veo-2", + "id": "deepseek-ai/DeepSeek-R1-0528", + "name": "DeepSeek R1 0528", + "display_name": "DeepSeek R1 0528", "modalities": { "input": [ "text" ], "output": [ - "video" + "text" ] }, "limit": { - "context": 480, - "output": 8192 + "context": 75000, + "output": 163840 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2024-12-02", - "last_updated": "2024-12-02", - "type": "chat" + "release_date": "2025-08-23", + "last_updated": "2025-08-23", + "cost": { + "input": 0.5, + "output": 2.15 + } }, { - "id": "google/gemini-3-flash", - "name": "gemini-3-flash", - "display_name": "gemini-3-flash", + "id": "deepseek-ai/DeepSeek-V3.1", + "name": "DeepSeek V3.1", + "display_name": "DeepSeek V3.1", "modalities": { "input": [ - "text", - "image", - "video", - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 75000, + "output": 163840 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-10-07", - "last_updated": "2025-10-07", + "release_date": "2025-08-23", + "last_updated": "2025-08-23", "cost": { - "input": 0.4, - "output": 2.4, - "cache_read": 0.04 - }, - "type": "chat" + "input": 0.2, + "output": 0.8 + } }, { - "id": "google/nano-banana-pro", - "name": "Nano-Banana-Pro", - "display_name": "Nano-Banana-Pro", + "id": "deepseek-ai/DeepSeek-V3-0324", + "name": "DeepSeek V3 0324", + "display_name": "DeepSeek V3 0324", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 65536, - "output": 8192 + "context": 75000, + "output": 163840 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-11-19", - "last_updated": "2025-11-19", + "release_date": "2025-08-23", + "last_updated": "2025-08-23", "cost": { - "input": 1.7, - "output": 10, - "cache_read": 0.17 - }, - "type": "chat" - }, + "input": 0.2, + "output": 0.8 + } + } + ] + }, + "nano-gpt": { + "id": "nano-gpt", + "name": "NanoGPT", + "display_name": "NanoGPT", + "api": "https://nano-gpt.com/api/v1", + "doc": "https://docs.nano-gpt.com", + "models": [ { - "id": "google/gemini-2.5-pro", - "name": "Gemini 2.5 Pro", - "display_name": "Gemini 2.5 Pro", + "id": "moonshotai/kimi-k2-thinking", + "name": "Kimi K2 Thinking", + "display_name": "Kimi K2 Thinking", "modalities": { "input": [ - "text", - "image", - "video", - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1065535, - "output": 65535 + "context": 32768, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-02-05", - "last_updated": "2025-02-05", + "knowledge": "2024-08", + "release_date": "2024-11-01", + "last_updated": "2025-12-24", "cost": { - "input": 0.87, - "output": 7, - "cache_read": 0.087 - }, - "type": "chat" + "input": 1, + "output": 2 + } }, { - "id": "google/veo-3.1-fast", - "name": "Veo-3.1-Fast", - "display_name": "Veo-3.1-Fast", + "id": "moonshotai/kimi-k2-instruct", + "name": "Kimi K2 Instruct", + "display_name": "Kimi K2 Instruct", "modalities": { "input": [ "text" ], "output": [ - "video" + "text" ] }, "limit": { - "context": 480, + "context": 131072, "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-10-15", - "last_updated": "2025-10-15", - "type": "chat" + "knowledge": "2024-10", + "release_date": "2024-07-18", + "last_updated": "2025-12-24", + "cost": { + "input": 1, + "output": 2 + } }, { - "id": "openai/gpt-4.1-nano", - "name": "GPT-4.1-nano", - "display_name": "GPT-4.1-nano", + "id": "nousresearch/hermes-4-405b:thinking", + "name": "Hermes 4 405b Thinking", + "display_name": "Hermes 4 405b Thinking", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 128000, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-04-15", - "last_updated": "2025-04-15", + "attachment": false, + "open_weights": true, + "release_date": "2024-08-13", + "last_updated": "2025-12-24", "cost": { - "input": 0.09, - "output": 0.36, - "cache_read": 0.022 - }, - "type": "chat" + "input": 1, + "output": 2 + } }, { - "id": "openai/gpt-5.2-instant", - "name": "gpt-5.2-instant", - "display_name": "gpt-5.2-instant", + "id": "nvidia/llama-3_3-nemotron-super-49b-v1_5", + "name": "Llama 3 3 Nemotron Super 49B V1 5", + "display_name": "Llama 3 3 Nemotron Super 49B V1 5", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -59298,253 +57424,243 @@ }, "limit": { "context": 128000, - "output": 16384 + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "attachment": false, + "open_weights": true, + "release_date": "2025-08-08", + "last_updated": "2025-12-24", "cost": { - "input": 1.6, - "output": 13, - "cache_read": 0.16 - }, - "type": "chat" + "input": 1, + "output": 2 + } }, { - "id": "openai/sora-2", - "name": "Sora-2", - "display_name": "Sora-2", + "id": "deepseek/deepseek-v3.2:thinking", + "name": "Deepseek V3.2 Thinking", + "display_name": "Deepseek V3.2 Thinking", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "video" + "text" ] }, "limit": { - "context": 8192, + "context": 128000, "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-10-06", - "last_updated": "2025-10-06", - "type": "chat" + "attachment": false, + "open_weights": true, + "release_date": "2025-12-01", + "last_updated": "2025-12-24", + "cost": { + "input": 1, + "output": 2 + } }, { - "id": "openai/o1-pro", - "name": "o1-pro", - "display_name": "o1-pro", + "id": "deepseek/deepseek-r1", + "name": "Deepseek R1", + "display_name": "Deepseek R1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 128000, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-03-19", - "last_updated": "2025-03-19", + "attachment": false, + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2025-01-20", + "last_updated": "2025-12-24", "cost": { - "input": 140, - "output": 540 - }, - "type": "chat" + "input": 1, + "output": 2 + } }, { - "id": "openai/gpt-5.1-codex", - "name": "GPT-5.1-Codex", - "display_name": "GPT-5.1-Codex", + "id": "minimax/minimax-m2.1", + "name": "Minimax M2.1", + "display_name": "Minimax M2.1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 128000, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-11-12", - "last_updated": "2025-11-12", + "release_date": "2025-12-23", + "last_updated": "2025-12-24", "cost": { - "input": 1.1, - "output": 9, - "cache_read": 0.11 - }, - "type": "chat" - }, + "input": 1, + "output": 2 + } + }, { - "id": "openai/gpt-3.5-turbo-raw", - "name": "GPT-3.5-Turbo-Raw", - "display_name": "GPT-3.5-Turbo-Raw", + "id": "openai/gpt-oss-120b", + "name": "GPT Oss 120b", + "display_name": "GPT Oss 120b", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 4524, - "output": 2048 + "context": 128000, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2023-09-27", - "last_updated": "2023-09-27", + "knowledge": "2024-10", + "release_date": "2025-06-23", + "last_updated": "2025-12-24", "cost": { - "input": 0.45, - "output": 1.4 - }, - "type": "chat" + "input": 1, + "output": 2 + } }, { - "id": "openai/gpt-4-classic", - "name": "GPT-4-Classic", - "display_name": "GPT-4-Classic", + "id": "z-ai/glm-4.6:thinking", + "name": "GLM 4.6 Thinking", + "display_name": "GLM 4.6 Thinking", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 4096 + "context": 128000, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2024-03-25", - "last_updated": "2024-03-25", + "attachment": false, + "open_weights": true, + "release_date": "2025-04-07", + "last_updated": "2025-12-24", "cost": { - "input": 27, - "output": 54 - }, - "type": "chat" + "input": 1, + "output": 2 + } }, { - "id": "openai/gpt-4.1-mini", - "name": "GPT-4.1-mini", - "display_name": "GPT-4.1-mini", + "id": "z-ai/glm-4.6", + "name": "GLM 4.6", + "display_name": "GLM 4.6", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 200000, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-04-15", - "last_updated": "2025-04-15", + "attachment": false, + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2024-11-15", + "last_updated": "2025-12-24", "cost": { - "input": 0.36, - "output": 1.4, - "cache_read": 0.09 - }, - "type": "chat" + "input": 1, + "output": 2 + } }, { - "id": "openai/gpt-5-chat", - "name": "GPT-5-Chat", - "display_name": "GPT-5-Chat", + "id": "qwen/qwen3-coder", + "name": "Qwen3 Coder", + "display_name": "Qwen3 Coder", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 106000, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "attachment": false, + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2025-01-15", + "last_updated": "2025-12-24", "cost": { - "input": 1.1, - "output": 9, - "cache_read": 0.11 - }, - "type": "chat" + "input": 1, + "output": 2 + } }, { - "id": "openai/o3-deep-research", - "name": "o3-deep-research", - "display_name": "o3-deep-research", + "id": "qwen/qwen3-235b-a22b-thinking-2507", + "name": "Qwen3 235B A22B Thinking 2507", + "display_name": "Qwen3 235B A22B Thinking 2507", "modalities": { "input": [ "text" @@ -59554,30 +57670,29 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 262144, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-06-27", - "last_updated": "2025-06-27", + "attachment": false, + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2025-07-01", + "last_updated": "2025-12-24", "cost": { - "input": 9, - "output": 36, - "cache_read": 2.2 - }, - "type": "chat" + "input": 1, + "output": 2 + } }, { - "id": "openai/gpt-4o-search", - "name": "GPT-4o-Search", - "display_name": "GPT-4o-Search", + "id": "mistralai/devstral-2-123b-instruct-2512", + "name": "Devstral 2 123b Instruct 2512", + "display_name": "Devstral 2 123b Instruct 2512", "modalities": { "input": [ "text" @@ -59587,186 +57702,185 @@ ] }, "limit": { - "context": 128000, + "context": 131072, "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-03-11", - "last_updated": "2025-03-11", + "attachment": false, + "open_weights": true, + "release_date": "2025-12-11", + "last_updated": "2025-12-24", "cost": { - "input": 2.2, - "output": 9 - }, - "type": "chat" + "input": 1, + "output": 2 + } }, { - "id": "openai/gpt-image-1.5", - "name": "gpt-image-1.5", - "display_name": "gpt-image-1.5", + "id": "mistralai/mistral-large-3-675b-instruct-2512", + "name": "Mistral Large 3 675b Instruct 2512", + "display_name": "Mistral Large 3 675b Instruct 2512", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 128000, + "context": 131072, "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-12-16", - "last_updated": "2025-12-16", - "type": "imageGeneration" + "attachment": false, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2025-12-02", + "last_updated": "2025-12-24", + "cost": { + "input": 1, + "output": 2 + } }, { - "id": "openai/gpt-image-1-mini", - "name": "GPT-Image-1-Mini", - "display_name": "GPT-Image-1-Mini", + "id": "mistralai/ministral-14b-instruct-2512", + "name": "Ministral 14b Instruct 2512", + "display_name": "Ministral 14b Instruct 2512", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 8192, + "context": 131072, "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-08-26", - "last_updated": "2025-08-26", - "type": "imageGeneration" + "attachment": false, + "open_weights": true, + "knowledge": "2025-12", + "release_date": "2025-12-01", + "last_updated": "2025-12-24", + "cost": { + "input": 1, + "output": 2 + } }, { - "id": "openai/gpt-3.5-turbo", - "name": "GPT-3.5-Turbo", - "display_name": "GPT-3.5-Turbo", + "id": "meta-llama/llama-4-maverick", + "name": "Llama 4 Maverick", + "display_name": "Llama 4 Maverick", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 16384, - "output": 2048 + "context": 128000, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2023-09-13", - "last_updated": "2023-09-13", + "attachment": false, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2025-04-05", + "last_updated": "2025-12-24", "cost": { - "input": 0.45, - "output": 1.4 - }, - "type": "chat" + "input": 1, + "output": 2 + } }, { - "id": "openai/gpt-5.2-pro", - "name": "gpt-5.2-pro", - "display_name": "gpt-5.2-pro", + "id": "meta-llama/llama-3.3-70b-instruct", + "name": "Llama 3.3 70b Instruct", + "display_name": "Llama 3.3 70b Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 128000, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "attachment": false, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-12-06", + "last_updated": "2025-12-24", "cost": { - "input": 19, - "output": 150 - }, - "type": "chat" + "input": 1, + "output": 2 + } }, { - "id": "openai/o3-mini-high", - "name": "o3-mini-high", - "display_name": "o3-mini-high", + "id": "zai-org/glm-4.7", + "name": "GLM 4.7", + "display_name": "GLM 4.7", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 204800, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-01-31", - "last_updated": "2025-01-31", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-24", "cost": { - "input": 0.99, - "output": 4 - }, - "type": "chat" + "input": 1, + "output": 2 + } }, { - "id": "openai/chatgpt-4o-latest", - "name": "ChatGPT-4o-Latest", - "display_name": "ChatGPT-4o-Latest", + "id": "zai-org/glm-4.5-air", + "name": "GLM 4.5 Air", + "display_name": "GLM 4.5 Air", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -59776,29 +57890,28 @@ "context": 128000, "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2024-08-14", - "last_updated": "2024-08-14", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-12-24", "cost": { - "input": 4.5, - "output": 14 - }, - "type": "chat" + "input": 1, + "output": 2 + } }, { - "id": "openai/gpt-4-turbo", - "name": "GPT-4-Turbo", - "display_name": "GPT-4-Turbo", + "id": "zai-org/glm-4.7:thinking", + "name": "GLM 4.7 Thinking", + "display_name": "GLM 4.7 Thinking", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -59806,27 +57919,27 @@ }, "limit": { "context": 128000, - "output": 4096 + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2023-09-13", - "last_updated": "2023-09-13", + "attachment": false, + "open_weights": true, + "release_date": "2025-04-07", + "last_updated": "2025-12-24", "cost": { - "input": 9, - "output": 27 - }, - "type": "chat" + "input": 1, + "output": 2 + } }, { - "id": "openai/gpt-5.1-codex-mini", - "name": "GPT-5.1-Codex-Mini", - "display_name": "GPT-5.1-Codex-Mini", + "id": "zai-org/glm-4.5-air:thinking", + "name": "GLM 4.5 Air Thinking", + "display_name": "GLM 4.5 Air Thinking", "modalities": { "input": [ "text" @@ -59836,553 +57949,579 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 128000, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-11-12", - "last_updated": "2025-11-12", + "attachment": false, + "open_weights": true, + "release_date": "2025-04-07", + "last_updated": "2025-12-24", "cost": { - "input": 0.22, - "output": 1.8, - "cache_read": 0.022 - }, - "type": "chat" - }, + "input": 1, + "output": 2 + } + } + ] + }, + "zai": { + "id": "zai", + "name": "Z.AI", + "display_name": "Z.AI", + "api": "https://api.z.ai/api/paas/v4", + "doc": "https://docs.z.ai/guides/overview/pricing", + "models": [ { - "id": "openai/gpt-5.1-instant", - "name": "GPT-5.1-Instant", - "display_name": "GPT-5.1-Instant", + "id": "glm-4.7", + "name": "GLM-4.7", + "display_name": "GLM-4.7", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 204800, + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-11-12", - "last_updated": "2025-11-12", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "cost": { - "input": 1.1, - "output": 9, - "cache_read": 0.11 - }, - "type": "chat" + "input": 0.6, + "output": 2.2, + "cache_read": 0.11, + "cache_write": 0 + } }, { - "id": "openai/o3-mini", - "name": "o3-mini", - "display_name": "o3-mini", + "id": "glm-4.5-flash", + "name": "GLM-4.5-Flash", + "display_name": "GLM-4.5-Flash", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 131072, + "output": 98304 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-01-31", - "last_updated": "2025-01-31", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 0.99, - "output": 4 - }, - "type": "chat" + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 + } }, { - "id": "openai/gpt-5.1", - "name": "GPT-5.1", - "display_name": "GPT-5.1", - "modalities": { + "id": "glm-4.5", + "name": "GLM-4.5", + "display_name": "GLM-4.5", + "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 131072, + "output": 98304 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-11-12", - "last_updated": "2025-11-12", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 1.1, - "output": 9, - "cache_read": 0.11 - }, - "type": "chat" + "input": 0.6, + "output": 2.2, + "cache_read": 0.11, + "cache_write": 0 + } }, { - "id": "openai/gpt-5-nano", - "name": "GPT-5-nano", - "display_name": "GPT-5-nano", + "id": "glm-4.7-flash", + "name": "GLM-4.7-Flash", + "display_name": "GLM-4.7-Flash", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 200000, + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2026-01-19", + "last_updated": "2026-01-19", "cost": { - "input": 0.045, - "output": 0.36, - "cache_read": 0.0045 - }, - "type": "chat" + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 + } }, { - "id": "openai/gpt-5-codex", - "name": "GPT-5-Codex", - "display_name": "GPT-5-Codex", + "id": "glm-4.5-air", + "name": "GLM-4.5-Air", + "display_name": "GLM-4.5-Air", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 131072, + "output": 98304 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-09-23", - "last_updated": "2025-09-23", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 1.1, - "output": 9 - }, - "type": "chat" + "input": 0.2, + "output": 1.1, + "cache_read": 0.03, + "cache_write": 0 + } }, { - "id": "openai/gpt-4o", - "name": "GPT-4o", - "display_name": "GPT-4o", + "id": "glm-4.5v", + "name": "GLM-4.5V", + "display_name": "GLM-4.5V", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 64000, + "output": 16384 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, - "open_weights": false, - "release_date": "2024-05-13", - "last_updated": "2024-05-13", - "type": "chat" + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-08-11", + "last_updated": "2025-08-11", + "cost": { + "input": 0.6, + "output": 1.8 + } }, { - "id": "openai/gpt-4.1", - "name": "GPT-4.1", - "display_name": "GPT-4.1", + "id": "glm-4.6", + "name": "GLM-4.6", + "display_name": "GLM-4.6", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 204800, + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", "cost": { - "input": 1.8, - "output": 7.2, - "cache_read": 0.45 - }, - "type": "chat" + "input": 0.6, + "output": 2.2, + "cache_read": 0.11, + "cache_write": 0 + } }, { - "id": "openai/o4-mini", - "name": "o4-mini", - "display_name": "o4-mini", + "id": "glm-4.6v", + "name": "GLM-4.6V", + "display_name": "GLM-4.6V", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 128000, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, "attachment": true, - "open_weights": false, - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-12-08", + "last_updated": "2025-12-08", "cost": { - "input": 0.99, - "output": 4, - "cache_read": 0.25 - }, - "type": "chat" - }, + "input": 0.3, + "output": 0.9 + } + } + ] + }, + "berget": { + "id": "berget", + "name": "Berget.AI", + "display_name": "Berget.AI", + "api": "https://api.berget.ai/v1", + "doc": "https://api.berget.ai", + "models": [ { - "id": "openai/o1", - "name": "o1", - "display_name": "o1", + "id": "intfloat/multilingual-e5-large", + "name": "Multilingual-E5-large", + "display_name": "Multilingual-E5-large", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 512, + "output": 1024 }, "temperature": false, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2024-12-18", - "last_updated": "2024-12-18", + "attachment": false, + "open_weights": true, + "knowledge": "2025-09", + "release_date": "2025-09-11", + "last_updated": "2025-09-11", "cost": { - "input": 14, - "output": 54 - }, - "type": "chat" + "input": 0.02, + "output": 0 + } }, { - "id": "openai/gpt-5-mini", - "name": "GPT-5-mini", - "display_name": "GPT-5-mini", + "id": "intfloat/multilingual-e5-large-instruct", + "name": "Multilingual-E5-large-instruct", + "display_name": "Multilingual-E5-large-instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 512, + "output": 1024 }, "temperature": false, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-06-25", - "last_updated": "2025-06-25", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-04-27", + "last_updated": "2025-04-27", "cost": { - "input": 0.22, - "output": 1.8, - "cache_read": 0.022 - }, - "type": "chat" + "input": 0.02, + "output": 0 + } }, { - "id": "openai/gpt-4o-aug", - "name": "GPT-4o-Aug", - "display_name": "GPT-4o-Aug", + "id": "KBLab/kb-whisper-large", + "name": "KB-Whisper-Large", + "display_name": "KB-Whisper-Large", "modalities": { "input": [ - "text", - "image" + "audio" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 480000, + "output": 4800 }, "temperature": false, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2024-11-21", - "last_updated": "2024-11-21", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-04-27", + "last_updated": "2025-04-27", "cost": { - "input": 2.2, - "output": 9, - "cache_read": 1.1 - }, - "type": "chat" + "input": 3, + "output": 3 + } }, { - "id": "openai/o3-pro", - "name": "o3-pro", - "display_name": "o3-pro", + "id": "BAAI/bge-reranker-v2-m3", + "name": "bge-reranker-v2-m3", + "display_name": "bge-reranker-v2-m3", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 512, + "output": 512 }, "temperature": false, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-06-10", - "last_updated": "2025-06-10", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-04-23", + "last_updated": "2025-04-23", "cost": { - "input": 18, - "output": 72 - }, - "type": "chat" + "input": 0.1, + "output": 0.1 + } }, { - "id": "openai/gpt-image-1", - "name": "GPT-Image-1", - "display_name": "GPT-Image-1", + "id": "openai/gpt-oss-120b", + "name": "GPT-OSS-120B", + "display_name": "GPT-OSS-120B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "image" + "text" ] }, "limit": { "context": 128000, "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-03-31", - "last_updated": "2025-03-31", - "type": "imageGeneration" + "attachment": false, + "open_weights": true, + "knowledge": "2025-08", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "cost": { + "input": 0.3, + "output": 0.9 + } }, { - "id": "openai/gpt-5.1-codex-max", - "name": "gpt-5.1-codex-max", - "display_name": "gpt-5.1-codex-max", + "id": "mistralai/Mistral-Small-3.2-24B-Instruct-2506", + "name": "Mistral Small 3.2 24B Instruct 2506", + "display_name": "Mistral Small 3.2 24B Instruct 2506", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 32000, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-12-08", - "last_updated": "2025-12-08", + "attachment": false, + "open_weights": true, + "knowledge": "2025-09", + "release_date": "2025-10-01", + "last_updated": "2025-10-01", "cost": { - "input": 1.1, - "output": 9, - "cache_read": 0.11 - }, - "type": "chat" + "input": 0.3, + "output": 0.3 + } }, { - "id": "openai/gpt-3.5-turbo-instruct", - "name": "GPT-3.5-Turbo-Instruct", - "display_name": "GPT-3.5-Turbo-Instruct", + "id": "meta-llama/Llama-3.3-70B-Instruct", + "name": "Llama 3.3 70B Instruct", + "display_name": "Llama 3.3 70B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 3500, - "output": 1024 + "context": 128000, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2023-09-20", - "last_updated": "2023-09-20", + "attachment": false, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2025-04-27", + "last_updated": "2025-04-27", "cost": { - "input": 1.4, - "output": 1.8 - }, - "type": "chat" + "input": 0.9, + "output": 0.9 + } }, { - "id": "openai/o3", - "name": "o3", - "display_name": "o3", + "id": "zai-org/GLM-4.7", + "name": "GLM 4.7", + "display_name": "GLM 4.7", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 128000, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "attachment": false, + "open_weights": true, + "knowledge": "2025-12", + "release_date": "2026-01-19", + "last_updated": "2026-01-19", "cost": { - "input": 1.8, - "output": 7.2, - "cache_read": 0.45 - }, - "type": "chat" - }, + "input": 0.7, + "output": 2.3 + } + } + ] + }, + "inference": { + "id": "inference", + "name": "Inference", + "display_name": "Inference", + "api": "https://inference.net/v1", + "doc": "https://inference.net/models", + "models": [ { - "id": "openai/o4-mini-deep-research", - "name": "o4-mini-deep-research", - "display_name": "o4-mini-deep-research", + "id": "mistral/mistral-nemo-12b-instruct", + "name": "Mistral Nemo 12B Instruct", + "display_name": "Mistral Nemo 12B Instruct", "modalities": { "input": [ "text" @@ -60392,30 +58531,28 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 16000, + "output": 4096 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-06-27", - "last_updated": "2025-06-27", + "attachment": false, + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 1.8, - "output": 7.2, - "cache_read": 0.45 - }, - "type": "chat" + "input": 0.038, + "output": 0.1 + } }, { - "id": "openai/gpt-4-classic-0314", - "name": "GPT-4-Classic-0314", - "display_name": "GPT-4-Classic-0314", + "id": "google/gemma-3", + "name": "Google Gemma 3", + "display_name": "Google Gemma 3", "modalities": { "input": [ "text", @@ -60426,217 +58563,216 @@ ] }, "limit": { - "context": 8192, + "context": 125000, "output": 4096 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, "attachment": true, - "open_weights": false, - "release_date": "2024-08-26", - "last_updated": "2024-08-26", + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 27, - "output": 54 - }, - "type": "chat" + "input": 0.15, + "output": 0.3 + } }, { - "id": "openai/gpt-4o-mini", - "name": "GPT-4o-mini", - "display_name": "GPT-4o-mini", + "id": "osmosis/osmosis-structure-0.6b", + "name": "Osmosis Structure 0.6B", + "display_name": "Osmosis Structure 0.6B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 4000, + "output": 2048 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2024-07-18", - "last_updated": "2024-07-18", + "attachment": false, + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.14, - "output": 0.54, - "cache_read": 0.068 - }, - "type": "chat" + "input": 0.1, + "output": 0.5 + } }, { - "id": "openai/gpt-5", - "name": "GPT-5", - "display_name": "GPT-5", + "id": "qwen/qwen3-embedding-4b", + "name": "Qwen 3 Embedding 4B", + "display_name": "Qwen 3 Embedding 4B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 32000, + "output": 2048 }, "temperature": false, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "attachment": false, + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 1.1, - "output": 9, - "cache_read": 0.11 - }, - "type": "chat" + "input": 0.01, + "output": 0 + } }, { - "id": "openai/dall-e-3", - "name": "DALL-E-3", - "display_name": "DALL-E-3", + "id": "qwen/qwen-2.5-7b-vision-instruct", + "name": "Qwen 2.5 7B Vision Instruct", + "display_name": "Qwen 2.5 7B Vision Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 800, - "output": 8192 + "context": 125000, + "output": 4096 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, "attachment": true, - "open_weights": false, - "release_date": "2023-11-06", - "last_updated": "2023-11-06", - "type": "imageGeneration" + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", + "cost": { + "input": 0.2, + "output": 0.2 + } }, { - "id": "openai/sora-2-pro", - "name": "Sora-2-Pro", - "display_name": "Sora-2-Pro", + "id": "meta/llama-3.2-11b-vision-instruct", + "name": "Llama 3.2 11B Vision Instruct", + "display_name": "Llama 3.2 11B Vision Instruct", "modalities": { "input": [ "text", "image" ], "output": [ - "video" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 16000, + "output": 4096 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, "attachment": true, - "open_weights": false, - "release_date": "2025-10-06", - "last_updated": "2025-10-06", - "type": "chat" + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", + "cost": { + "input": 0.055, + "output": 0.055 + } }, { - "id": "openai/gpt-5-pro", - "name": "GPT-5-Pro", - "display_name": "GPT-5-Pro", + "id": "meta/llama-3.1-8b-instruct", + "name": "Llama 3.1 8B Instruct", + "display_name": "Llama 3.1 8B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 16000, + "output": 4096 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-10-06", - "last_updated": "2025-10-06", + "attachment": false, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 14, - "output": 110 - }, - "type": "chat" + "input": 0.025, + "output": 0.025 + } }, { - "id": "openai/gpt-5.2", - "name": "gpt-5.2", - "display_name": "gpt-5.2", + "id": "meta/llama-3.2-3b-instruct", + "name": "Llama 3.2 3B Instruct", + "display_name": "Llama 3.2 3B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 16000, + "output": 4096 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-12-08", - "last_updated": "2025-12-08", + "attachment": false, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 1.6, - "output": 13, - "cache_read": 0.16 - }, - "type": "chat" + "input": 0.02, + "output": 0.02 + } }, { - "id": "openai/gpt-4o-mini-search", - "name": "GPT-4o-mini-Search", - "display_name": "GPT-4o-mini-Search", + "id": "meta/llama-3.2-1b-instruct", + "name": "Llama 3.2 1B Instruct", + "display_name": "Llama 3.2 1B Instruct", "modalities": { "input": [ "text" @@ -60646,143 +58782,188 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 16000, + "output": 4096 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-03-11", - "last_updated": "2025-03-11", + "attachment": false, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.14, - "output": 0.54 - }, - "type": "chat" - }, + "input": 0.01, + "output": 0.01 + } + } + ] + }, + "requesty": { + "id": "requesty", + "name": "Requesty", + "display_name": "Requesty", + "api": "https://router.requesty.ai/v1", + "doc": "https://requesty.ai/solution/llm-routing/models", + "models": [ { - "id": "stabilityai/stablediffusionxl", - "name": "StableDiffusionXL", - "display_name": "StableDiffusionXL", + "id": "xai/grok-4", + "name": "Grok 4", + "display_name": "Grok 4", "modalities": { "input": [ "text", "image" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 200, - "output": 8192 + "context": 256000, + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "release_date": "2023-07-09", - "last_updated": "2023-07-09", - "type": "chat" + "knowledge": "2025-01", + "release_date": "2025-09-09", + "last_updated": "2025-09-09", + "cost": { + "input": 3, + "output": 15, + "cache_read": 0.75, + "cache_write": 3 + } }, { - "id": "topazlabs-co/topazlabs", - "name": "TopazLabs", - "display_name": "TopazLabs", + "id": "xai/grok-4-fast", + "name": "Grok 4 Fast", + "display_name": "Grok 4 Fast", "modalities": { "input": [ "text" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 204, - "output": 8192 + "context": 2000000, + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "release_date": "2024-12-03", - "last_updated": "2024-12-03", - "type": "chat" + "knowledge": "2025-01", + "release_date": "2025-09-19", + "last_updated": "2025-09-19", + "cost": { + "input": 0.2, + "output": 0.5, + "cache_read": 0.05, + "cache_write": 0.2 + } }, { - "id": "lumalabs/ray2", - "name": "Ray2", - "display_name": "Ray2", + "id": "google/gemini-3-flash-preview", + "name": "Gemini 3 Flash", + "display_name": "Gemini 3 Flash", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video", + "pdf" ], "output": [ - "video" + "text" ] }, "limit": { - "context": 5000, - "output": 8192 + "context": 1048576, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "release_date": "2025-02-20", - "last_updated": "2025-02-20", - "type": "chat" + "knowledge": "2025-01", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", + "cost": { + "input": 0.5, + "output": 3, + "cache_read": 0.05, + "cache_write": 1 + } }, { - "id": "lumalabs/dream-machine", - "name": "Dream-Machine", - "display_name": "Dream-Machine", + "id": "google/gemini-3-pro-preview", + "name": "Gemini 3 Pro", + "display_name": "Gemini 3 Pro", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video", + "pdf" ], "output": [ - "video" + "text" ] }, "limit": { - "context": 5000, - "output": 8192 + "context": 1048576, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "release_date": "2024-09-18", - "last_updated": "2024-09-18", - "type": "chat" + "knowledge": "2025-01", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", + "cost": { + "input": 2, + "output": 12, + "cache_read": 0.2, + "cache_write": 4.5 + } }, { - "id": "anthropic/claude-opus-3", - "name": "Claude-Opus-3", - "display_name": "Claude-Opus-3", + "id": "google/gemini-2.5-flash", + "name": "Gemini 2.5 Flash", + "display_name": "Gemini 2.5 Flash", "modalities": { "input": [ "text", "image", + "audio", + "video", "pdf" ], "output": [ @@ -60790,34 +58971,37 @@ ] }, "limit": { - "context": 189096, - "output": 8192 + "context": 1048576, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "release_date": "2024-03-04", - "last_updated": "2024-03-04", + "knowledge": "2025-01", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", "cost": { - "input": 13, - "output": 64, - "cache_read": 1.3, - "cache_write": 16 - }, - "type": "chat" + "input": 0.3, + "output": 2.5, + "cache_read": 0.075, + "cache_write": 0.55 + } }, { - "id": "anthropic/claude-opus-4", - "name": "Claude Opus 4", - "display_name": "Claude Opus 4", + "id": "google/gemini-2.5-pro", + "name": "Gemini 2.5 Pro", + "display_name": "Gemini 2.5 Pro", "modalities": { "input": [ "text", "image", + "audio", + "video", "pdf" ], "output": [ @@ -60825,10 +59009,10 @@ ] }, "limit": { - "context": 192512, - "output": 32768 + "context": 1048576, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -60836,69 +59020,64 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-05-21", - "last_updated": "2025-05-21", + "knowledge": "2025-01", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", "cost": { - "input": 13, - "output": 64, - "cache_read": 1.3, - "cache_write": 16 - }, - "type": "chat" + "input": 1.25, + "output": 10, + "cache_read": 0.31, + "cache_write": 2.375 + } }, { - "id": "anthropic/claude-sonnet-3.7-reasoning", - "name": "Claude Sonnet 3.7 Reasoning", - "display_name": "Claude Sonnet 3.7 Reasoning", + "id": "openai/gpt-4.1-mini", + "name": "GPT-4.1 Mini", + "display_name": "GPT-4.1 Mini", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 196608, - "output": 128000 + "context": 1047576, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-02-19", - "last_updated": "2025-02-19", + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 2.6, - "output": 13, - "cache_read": 0.26, - "cache_write": 3.2 - }, - "type": "chat" + "input": 0.4, + "output": 1.6, + "cache_read": 0.1 + } }, { - "id": "anthropic/claude-opus-4-search", - "name": "Claude Opus 4 Search", - "display_name": "Claude Opus 4 Search", + "id": "openai/gpt-5-nano", + "name": "GPT-5 Nano", + "display_name": "GPT-5 Nano", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 196608, - "output": 128000 + "context": 16000, + "output": 4000 }, "temperature": false, "tool_call": true, @@ -60908,104 +59087,98 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-06-20", - "last_updated": "2025-06-20", + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 13, - "output": 64, - "cache_read": 1.3, - "cache_write": 16 - }, - "type": "chat" + "input": 0.05, + "output": 0.4, + "cache_read": 0.01 + } }, { - "id": "anthropic/claude-sonnet-3.7", - "name": "Claude Sonnet 3.7", - "display_name": "Claude Sonnet 3.7", + "id": "openai/gpt-4.1", + "name": "GPT-4.1", + "display_name": "GPT-4.1", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 196608, + "context": 1047576, "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-02-19", - "last_updated": "2025-02-19", + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 2.6, - "output": 13, - "cache_read": 0.26, - "cache_write": 3.2 - }, - "type": "chat" + "input": 2, + "output": 8, + "cache_read": 0.5 + } }, { - "id": "anthropic/claude-haiku-3.5-search", - "name": "Claude-Haiku-3.5-Search", - "display_name": "Claude-Haiku-3.5-Search", + "id": "openai/o4-mini", + "name": "o4 Mini", + "display_name": "o4 Mini", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 189096, - "output": 8192 + "context": 200000, + "output": 100000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "release_date": "2025-05-15", - "last_updated": "2025-05-15", + "knowledge": "2024-06", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "cost": { - "input": 0.68, - "output": 3.4, - "cache_read": 0.068, - "cache_write": 0.85 - }, - "type": "chat" + "input": 1.1, + "output": 4.4, + "cache_read": 0.28 + } }, { - "id": "anthropic/claude-haiku-4.5", - "name": "Claude Haiku 4.5", - "display_name": "Claude Haiku 4.5", + "id": "openai/gpt-5-mini", + "name": "GPT-5 Mini", + "display_name": "GPT-5 Mini", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 192000, - "output": 64000 + "context": 128000, + "output": 32000 }, "temperature": false, "tool_call": true, @@ -61015,33 +59188,68 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.85, - "output": 4.3, - "cache_read": 0.085, - "cache_write": 1.1 + "input": 0.25, + "output": 2, + "cache_read": 0.03 + } + }, + { + "id": "openai/gpt-4o-mini", + "name": "GPT-4o Mini", + "display_name": "GPT-4o Mini", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] }, - "type": "chat" + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-10", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", + "cost": { + "input": 0.15, + "output": 0.6, + "cache_read": 0.08 + } }, { - "id": "anthropic/claude-sonnet-4-reasoning", - "name": "Claude Sonnet 4 Reasoning", - "display_name": "Claude Sonnet 4 Reasoning", + "id": "openai/gpt-5", + "name": "GPT-5", + "display_name": "GPT-5", "modalities": { "input": [ "text", + "audio", "image", - "pdf" + "video" ], "output": [ - "text" + "text", + "audio", + "image" ] }, "limit": { - "context": 983040, - "output": 64000 + "context": 400000, + "output": 128000 }, "temperature": false, "tool_call": true, @@ -61051,20 +59259,19 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-05-21", - "last_updated": "2025-05-21", + "knowledge": "2024-09-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 2.6, - "output": 13, - "cache_read": 0.26, - "cache_write": 3.2 - }, - "type": "chat" + "input": 1.25, + "output": 10, + "cache_read": 0.13 + } }, { - "id": "anthropic/claude-haiku-3", - "name": "Claude-Haiku-3", - "display_name": "Claude-Haiku-3", + "id": "anthropic/claude-opus-4", + "name": "Claude Opus 4", + "display_name": "Claude Opus 4", "modalities": { "input": [ "text", @@ -61076,28 +59283,29 @@ ] }, "limit": { - "context": 189096, - "output": 8192 + "context": 200000, + "output": 32000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "release_date": "2024-03-09", - "last_updated": "2024-03-09", + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 0.21, - "output": 1.1, - "cache_read": 0.021, - "cache_write": 0.26 - }, - "type": "chat" + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 + } }, { - "id": "anthropic/claude-opus-4.1", + "id": "anthropic/claude-opus-4-1", "name": "Claude Opus 4.1", "display_name": "Claude Opus 4.1", "modalities": { @@ -61111,10 +59319,10 @@ ] }, "limit": { - "context": 196608, + "context": 200000, "output": 32000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -61122,20 +59330,20 @@ }, "attachment": true, "open_weights": false, + "knowledge": "2025-03-31", "release_date": "2025-08-05", "last_updated": "2025-08-05", "cost": { - "input": 13, - "output": 64, - "cache_read": 1.3, - "cache_write": 16 - }, - "type": "chat" + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 + } }, { - "id": "anthropic/claude-sonnet-3.7-search", - "name": "Claude Sonnet 3.7 Search", - "display_name": "Claude Sonnet 3.7 Search", + "id": "anthropic/claude-haiku-4-5", + "name": "Claude Haiku 4.5", + "display_name": "Claude Haiku 4.5", "modalities": { "input": [ "text", @@ -61147,10 +59355,10 @@ ] }, "limit": { - "context": 196608, - "output": 128000 + "context": 200000, + "output": 62000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -61158,20 +59366,20 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-05-15", - "last_updated": "2025-05-15", + "knowledge": "2025-02-01", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "cost": { - "input": 2.6, - "output": 13, - "cache_read": 0.26, - "cache_write": 3.2 - }, - "type": "chat" + "input": 1, + "output": 5, + "cache_read": 0.1, + "cache_write": 1.25 + } }, { - "id": "anthropic/claude-opus-4-reasoning", - "name": "Claude Opus 4 Reasoning", - "display_name": "Claude Opus 4 Reasoning", + "id": "anthropic/claude-opus-4-5", + "name": "Claude Opus 4.5", + "display_name": "Claude Opus 4.5", "modalities": { "input": [ "text", @@ -61183,10 +59391,10 @@ ] }, "limit": { - "context": 196608, - "output": 32768 + "context": 200000, + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -61194,20 +59402,20 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-05-21", - "last_updated": "2025-05-21", + "knowledge": "2025-03-31", + "release_date": "2025-11-24", + "last_updated": "2025-11-24", "cost": { - "input": 13, - "output": 64, - "cache_read": 1.3, - "cache_write": 16 - }, - "type": "chat" + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 + } }, { - "id": "anthropic/claude-sonnet-3.5", - "name": "Claude-Sonnet-3.5", - "display_name": "Claude-Sonnet-3.5", + "id": "anthropic/claude-sonnet-4-5", + "name": "Claude Sonnet 4.5", + "display_name": "Claude Sonnet 4.5", "modalities": { "input": [ "text", @@ -61219,30 +59427,31 @@ ] }, "limit": { - "context": 189096, - "output": 8192 + "context": 1000000, + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "release_date": "2024-06-05", - "last_updated": "2024-06-05", + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 2.6, - "output": 13, - "cache_read": 0.26, - "cache_write": 3.2 - }, - "type": "chat" + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 + } }, { - "id": "anthropic/claude-sonnet-4", - "name": "Claude Sonnet 4", - "display_name": "Claude Sonnet 4", + "id": "anthropic/claude-3-7-sonnet", + "name": "Claude Sonnet 3.7", + "display_name": "Claude Sonnet 3.7", "modalities": { "input": [ "text", @@ -61254,10 +59463,10 @@ ] }, "limit": { - "context": 983040, - "output": 32768 + "context": 200000, + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -61265,20 +59474,20 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-05-21", - "last_updated": "2025-05-21", + "knowledge": "2024-01", + "release_date": "2025-02-19", + "last_updated": "2025-02-19", "cost": { - "input": 2.6, - "output": 13, - "cache_read": 0.26, - "cache_write": 3.2 - }, - "type": "chat" + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 + } }, { - "id": "anthropic/claude-opus-4.5", - "name": "claude-opus-4.5", - "display_name": "claude-opus-4.5", + "id": "anthropic/claude-sonnet-4", + "name": "Claude Sonnet 4", + "display_name": "Claude Sonnet 4", "modalities": { "input": [ "text", @@ -61290,10 +59499,10 @@ ] }, "limit": { - "context": 196608, + "context": 200000, "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -61301,162 +59510,159 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-11-21", - "last_updated": "2025-11-21", + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 4.3, - "output": 21, - "cache_read": 0.43, - "cache_write": 5.3 - }, - "type": "chat" - }, + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 + } + } + ] + }, + "morph": { + "id": "morph", + "name": "Morph", + "display_name": "Morph", + "api": "https://api.morphllm.com/v1", + "doc": "https://docs.morphllm.com/api-reference/introduction", + "models": [ { - "id": "anthropic/claude-haiku-3.5", - "name": "Claude-Haiku-3.5", - "display_name": "Claude-Haiku-3.5", + "id": "morph-v3-large", + "name": "Morph v3 Large", + "display_name": "Morph v3 Large", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 189096, - "output": 8192 + "context": 32000, + "output": 32000 }, "temperature": false, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2024-10-01", - "last_updated": "2024-10-01", + "release_date": "2024-08-15", + "last_updated": "2024-08-15", "cost": { - "input": 0.68, - "output": 3.4, - "cache_read": 0.068, - "cache_write": 0.85 - }, - "type": "chat" + "input": 0.9, + "output": 1.9 + } }, { - "id": "anthropic/claude-sonnet-3.5-june", - "name": "Claude-Sonnet-3.5-June", - "display_name": "Claude-Sonnet-3.5-June", + "id": "auto", + "name": "Auto", + "display_name": "Auto", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 189096, - "output": 8192 + "context": 32000, + "output": 32000 }, "temperature": false, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2024-11-18", - "last_updated": "2024-11-18", + "release_date": "2024-06-01", + "last_updated": "2024-06-01", "cost": { - "input": 2.6, - "output": 13, - "cache_read": 0.26, - "cache_write": 3.2 - }, - "type": "chat" + "input": 0.85, + "output": 1.55 + } }, { - "id": "anthropic/claude-sonnet-4.5", - "name": "Claude Sonnet 4.5", - "display_name": "Claude Sonnet 4.5", + "id": "morph-v3-fast", + "name": "Morph v3 Fast", + "display_name": "Morph v3 Fast", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 983040, - "output": 32768 + "context": 16000, + "output": 16000 }, "temperature": false, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-09-26", - "last_updated": "2025-09-26", + "release_date": "2024-08-15", + "last_updated": "2024-08-15", "cost": { - "input": 2.6, - "output": 13, - "cache_read": 0.26, - "cache_write": 3.2 - }, - "type": "chat" - }, + "input": 0.8, + "output": 1.2 + } + } + ] + }, + "lmstudio": { + "id": "lmstudio", + "name": "LMStudio", + "display_name": "LMStudio", + "api": "http://127.0.0.1:1234/v1", + "doc": "https://lmstudio.ai/models", + "models": [ { - "id": "anthropic/claude-sonnet-4-search", - "name": "Claude Sonnet 4 Search", - "display_name": "Claude Sonnet 4 Search", + "id": "openai/gpt-oss-20b", + "name": "GPT OSS 20B", + "display_name": "GPT OSS 20B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 983040, - "output": 128000 + "context": 131072, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-06-20", - "last_updated": "2025-06-20", + "attachment": false, + "open_weights": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 2.6, - "output": 13, - "cache_read": 0.26, - "cache_write": 3.2 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "trytako/tako", - "name": "Tako", - "display_name": "Tako", + "id": "qwen/qwen3-30b-a3b-2507", + "name": "Qwen3 30B A3B 2507", + "display_name": "Qwen3 30B A3B 2507", "modalities": { "input": [ "text" @@ -61466,24 +59672,28 @@ ] }, "limit": { - "context": 2048, - "output": 8192 + "context": 262144, + "output": 16384 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2024-08-15", - "last_updated": "2024-08-15", - "type": "chat" + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-30", + "last_updated": "2025-07-30", + "cost": { + "input": 0, + "output": 0 + } }, { - "id": "novita/glm-4.7", - "name": "glm-4.7", - "display_name": "glm-4.7", + "id": "qwen/qwen3-coder-30b", + "name": "Qwen3 Coder 30B", + "display_name": "Qwen3 Coder 30B", "modalities": { "input": [ "text" @@ -61493,25 +59703,37 @@ ] }, "limit": { - "context": 205000, - "output": 131072 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-12-22", - "last_updated": "2025-12-22", - "type": "chat" - }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", + "cost": { + "input": 0, + "output": 0 + } + } + ] + }, + "friendli": { + "id": "friendli", + "name": "Friendli", + "display_name": "Friendli", + "api": "https://api.friendli.ai/serverless/v1", + "doc": "https://friendli.ai/docs/guides/serverless_endpoints/introduction", + "models": [ { - "id": "novita/kimi-k2-thinking", - "name": "kimi-k2-thinking", - "display_name": "kimi-k2-thinking", + "id": "MiniMaxAI/MiniMax-M2.1", + "name": "MiniMax M2.1", + "display_name": "MiniMax M2.1", "modalities": { "input": [ "text" @@ -61521,25 +59743,28 @@ ] }, "limit": { - "context": 256000, - "output": 8192 + "context": 196608, + "output": 196608 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-11-07", - "last_updated": "2025-11-07", - "type": "chat" + "attachment": false, + "open_weights": true, + "release_date": "2026-01-13", + "last_updated": "2026-01-29", + "cost": { + "input": 0.3, + "output": 1.2 + } }, { - "id": "novita/kat-coder-pro", - "name": "kat-coder-pro", - "display_name": "kat-coder-pro", + "id": "LGAI-EXAONE/K-EXAONE-236B-A23B", + "name": "K EXAONE 236B A23B", + "display_name": "K EXAONE 236B A23B", "modalities": { "input": [ "text" @@ -61549,108 +59774,28 @@ ] }, "limit": { - "context": 256000, - "output": 8192 - }, - "temperature": false, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": false, - "release_date": "2025-12-16", - "last_updated": "2025-12-16", - "type": "chat" - }, - { - "id": "novita/glm-4.6", - "name": "GLM-4.6", - "display_name": "GLM-4.6", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 8192, - "output": 8192 - }, - "temperature": false, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": false, - "release_date": "2025-09-30", - "last_updated": "2025-09-30", - "type": "chat" - }, - { - "id": "novita/minimax-m2.1", - "name": "minimax-m2.1", - "display_name": "minimax-m2.1", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 205000, - "output": 131072 - }, - "temperature": false, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "attachment": true, - "open_weights": false, - "release_date": "2025-12-26", - "last_updated": "2025-12-26", - "type": "chat" - }, - { - "id": "novita/glm-4.6v", - "name": "glm-4.6v", - "display_name": "glm-4.6v", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 131000, - "output": 32768 + "context": 262144, + "output": 262144 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-12-09", - "last_updated": "2025-12-09", - "type": "chat" + "attachment": false, + "open_weights": true, + "release_date": "2025-12-31", + "last_updated": "2026-01-08", + "cost": { + "input": 0, + "output": 0 + } }, { - "id": "cerebras/gpt-oss-120b-cs", - "name": "gpt-oss-120b-cs", - "display_name": "gpt-oss-120b-cs", + "id": "LGAI-EXAONE/EXAONE-4.0.1-32B", + "name": "EXAONE 4.0.1 32B", + "display_name": "EXAONE 4.0.1 32B", "modalities": { "input": [ "text" @@ -61660,61 +59805,28 @@ ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 131072, + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-08-06", - "last_updated": "2025-08-06", - "type": "chat" + "attachment": false, + "open_weights": true, + "release_date": "2025-07-31", + "last_updated": "2025-12-23", + "cost": { + "input": 0.6, + "output": 1 + } }, { - "id": "cerebras/zai-glm-4.6-cs", - "name": "zai-glm-4.6-cs", - "display_name": "zai-glm-4.6-cs", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 131000, - "output": 40000 - }, - "temperature": false, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "attachment": true, - "open_weights": false, - "release_date": "2025-11-11", - "last_updated": "2025-11-11", - "type": "chat" - } - ] - }, - "cerebras": { - "id": "cerebras", - "name": "Cerebras", - "display_name": "Cerebras", - "doc": "https://inference-docs.cerebras.ai/models/overview", - "models": [ - { - "id": "zai-glm-4.7", - "name": "Z.AI GLM-4.7", - "display_name": "Z.AI GLM-4.7", + "id": "meta-llama/Llama-3.1-8B-Instruct", + "name": "Llama 3.1 8B Instruct", + "display_name": "Llama 3.1 8B Instruct", "modalities": { "input": [ "text" @@ -61725,7 +59837,7 @@ }, "limit": { "context": 131072, - "output": 40000 + "output": 8000 }, "temperature": true, "tool_call": true, @@ -61734,20 +59846,17 @@ }, "attachment": false, "open_weights": true, - "release_date": "2026-01-10", - "last_updated": "2026-01-10", + "release_date": "2024-08-01", + "last_updated": "2025-12-23", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 - }, - "type": "chat" + "input": 0.1, + "output": 0.1 + } }, { - "id": "qwen-3-235b-a22b-instruct-2507", - "name": "Qwen 3 235B Instruct", - "display_name": "Qwen 3 235B Instruct", + "id": "meta-llama/Llama-3.3-70B-Instruct", + "name": "Llama 3.3 70B Instruct", + "display_name": "Llama 3.3 70B Instruct", "modalities": { "input": [ "text" @@ -61757,8 +59866,8 @@ ] }, "limit": { - "context": 131000, - "output": 32000 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -61767,19 +59876,17 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-22", - "last_updated": "2025-07-22", + "release_date": "2024-08-01", + "last_updated": "2025-12-23", "cost": { "input": 0.6, - "output": 1.2 - }, - "type": "chat" + "output": 0.6 + } }, { - "id": "zai-glm-4.6", - "name": "Z.AI GLM-4.6", - "display_name": "Z.AI GLM-4.6", + "id": "Qwen/Qwen3-235B-A22B-Instruct-2507", + "name": "Qwen3 235B A22B Instruct 2507", + "display_name": "Qwen3 235B A22B Instruct 2507", "modalities": { "input": [ "text" @@ -61789,8 +59896,8 @@ ] }, "limit": { - "context": 131072, - "output": 40960 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -61799,20 +59906,17 @@ }, "attachment": false, "open_weights": true, - "release_date": "2025-11-05", - "last_updated": "2025-11-05", + "release_date": "2025-07-29", + "last_updated": "2026-01-29", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 - }, - "type": "chat" + "input": 0.2, + "output": 0.8 + } }, { - "id": "gpt-oss-120b", - "name": "GPT OSS 120B", - "display_name": "GPT OSS 120B", + "id": "zai-org/GLM-4.7", + "name": "GLM 4.7", + "display_name": "GLM 4.7", "modalities": { "input": [ "text" @@ -61822,8 +59926,8 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 202752, + "output": 202752 }, "temperature": true, "tool_call": true, @@ -61833,138 +59937,179 @@ }, "attachment": false, "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", - "cost": { - "input": 0.25, - "output": 0.69 - }, - "type": "chat" + "release_date": "2025-12-22", + "last_updated": "2026-01-29" } ] }, - "ollama": { - "id": "ollama", - "name": "Ollama Cloud", - "display_name": "Ollama Cloud", - "api": "https://ollama.com/v1", - "doc": "https://docs.ollama.com/cloud", + "sap-ai-core": { + "id": "sap-ai-core", + "name": "SAP AI Core", + "display_name": "SAP AI Core", + "doc": "https://help.sap.com/docs/sap-ai-core", "models": [ { - "id": "gemini-3-pro-preview:latest", - "name": "Gemini 3 Pro Preview", - "display_name": "Gemini 3 Pro Preview", + "id": "anthropic--claude-4.5-opus", + "name": "anthropic--claude-4.5-opus", + "display_name": "anthropic--claude-4.5-opus", "modalities": { "input": [ "text", "image", - "audio", - "video" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1000000, + "context": 200000, "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2025-10", - "release_date": "2025-11-18", - "last_updated": "2025-11-18", - "type": "chat" + "knowledge": "2025-04-30", + "release_date": "2025-11-24", + "last_updated": "2025-11-24", + "cost": { + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 + } }, { - "id": "gpt-oss:latest", - "name": "GPT-OSS Latest", - "display_name": "GPT-OSS Latest", + "id": "anthropic--claude-3.5-sonnet", + "name": "anthropic--claude-3.5-sonnet", + "display_name": "anthropic--claude-3.5-sonnet", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 200000, + "output": 8192 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2024-04-30", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", + "cost": { + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 + } }, { - "id": "gpt-oss:20b", - "name": "GPT-OSS 20B", - "display_name": "GPT-OSS 20B", + "id": "anthropic--claude-4.5-haiku", + "name": "anthropic--claude-4.5-haiku", + "display_name": "anthropic--claude-4.5-haiku", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 200000, + "output": 64000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2025-02-28", + "release_date": "2025-10-01", + "last_updated": "2025-10-01", + "cost": { + "input": 1, + "output": 5, + "cache_read": 0.1, + "cache_write": 1.25 + } }, { - "id": "gpt-oss:120b", - "name": "GPT-OSS 120B", - "display_name": "GPT-OSS 120B", + "id": "anthropic--claude-4-opus", + "name": "anthropic--claude-4-opus", + "display_name": "anthropic--claude-4-opus", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 200000, + "output": 32000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2025-01-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", + "cost": { + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 + } }, { - "id": "gpt-oss:20b-cloud", - "name": "GPT-OSS 20B", - "display_name": "GPT-OSS 20B", + "id": "gemini-2.5-flash", + "name": "gemini-2.5-flash", + "display_name": "gemini-2.5-flash", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 8192 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -61972,19 +60117,27 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-03-25", + "last_updated": "2025-06-05", + "cost": { + "input": 0.3, + "output": 2.5, + "cache_read": 0.03, + "input_audio": 1 + } }, { - "id": "gpt-oss:120b-cloud", - "name": "GPT-OSS 120B", - "display_name": "GPT-OSS 120B", + "id": "anthropic--claude-3-haiku", + "name": "anthropic--claude-3-haiku", + "display_name": "anthropic--claude-3-haiku", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" @@ -61992,47 +60145,64 @@ }, "limit": { "context": 200000, - "output": 8192 + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2023-08-31", + "release_date": "2024-03-13", + "last_updated": "2024-03-13", + "cost": { + "input": 0.25, + "output": 1.25, + "cache_read": 0.03, + "cache_write": 0.3 + } }, { - "id": "qwen3-vl:latest", - "name": "Qwen3-VL Latest", - "display_name": "Qwen3-VL Latest", + "id": "anthropic--claude-3-sonnet", + "name": "anthropic--claude-3-sonnet", + "display_name": "anthropic--claude-3-sonnet", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 65536 + "context": 200000, + "output": 4096 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2023-08-31", + "release_date": "2024-03-04", + "last_updated": "2024-03-04", + "cost": { + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 + } }, { - "id": "qwen3-vl:2b", - "name": "Qwen3-VL 2B", - "display_name": "Qwen3-VL 2B", + "id": "gpt-5-nano", + "name": "gpt-5-nano", + "display_name": "gpt-5-nano", "modalities": { "input": [ "text", @@ -62043,42 +60213,66 @@ ] }, "limit": { - "context": 256000, - "output": 65536 + "context": 400000, + "output": 128000 }, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", + "cost": { + "input": 0.05, + "output": 0.4, + "cache_read": 0.01 + } }, { - "id": "qwen3-vl:4b", - "name": "Qwen3-VL 4B", - "display_name": "Qwen3-VL 4B", + "id": "anthropic--claude-3.7-sonnet", + "name": "anthropic--claude-3.7-sonnet", + "display_name": "anthropic--claude-3.7-sonnet", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 65536 + "context": 200000, + "output": 64000 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2024-10-31", + "release_date": "2025-02-24", + "last_updated": "2025-02-24", + "cost": { + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 + } }, { - "id": "qwen3-vl:8b", - "name": "Qwen3-VL 8B", - "display_name": "Qwen3-VL 8B", + "id": "gpt-5-mini", + "name": "gpt-5-mini", + "display_name": "gpt-5-mini", "modalities": { "input": [ "text", @@ -62089,385 +60283,619 @@ ] }, "limit": { - "context": 256000, - "output": 65536 + "context": 400000, + "output": 128000 }, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" - }, - { - "id": "qwen3-vl:30b", - "name": "Qwen3-VL 30B", - "display_name": "Qwen3-VL 30B", + "attachment": true, + "open_weights": false, + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", + "cost": { + "input": 0.25, + "output": 2, + "cache_read": 0.025 + } + }, + { + "id": "anthropic--claude-4.5-sonnet", + "name": "anthropic--claude-4.5-sonnet", + "display_name": "anthropic--claude-4.5-sonnet", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 65536 + "context": 200000, + "output": 64000 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2025-01-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", + "cost": { + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 + } }, { - "id": "qwen3-vl:32b", - "name": "Qwen3-VL 32B", - "display_name": "Qwen3-VL 32B", + "id": "gemini-2.5-pro", + "name": "gemini-2.5-pro", + "display_name": "gemini-2.5-pro", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, + "context": 1048576, "output": 65536 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-03-25", + "last_updated": "2025-06-05", + "cost": { + "input": 1.25, + "output": 10, + "cache_read": 0.125 + } }, { - "id": "qwen3-vl:235b", - "name": "Qwen3-VL 235B", - "display_name": "Qwen3-VL 235B", + "id": "anthropic--claude-3-opus", + "name": "anthropic--claude-3-opus", + "display_name": "anthropic--claude-3-opus", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 65536 + "context": 200000, + "output": 4096 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2023-08-31", + "release_date": "2024-02-29", + "last_updated": "2024-02-29", + "cost": { + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 + } }, { - "id": "qwen3-vl:235b-cloud", - "name": "Qwen3-VL 235B Cloud", - "display_name": "Qwen3-VL 235B Cloud", + "id": "anthropic--claude-4-sonnet", + "name": "anthropic--claude-4-sonnet", + "display_name": "anthropic--claude-4-sonnet", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 65536 + "context": 200000, + "output": 64000 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2025-01-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", + "cost": { + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 + } }, { - "id": "qwen3-vl:235b-instruct-cloud", - "name": "Qwen3-VL 235B Instruct Cloud", - "display_name": "Qwen3-VL 235B Instruct Cloud", + "id": "gpt-5", + "name": "gpt-5", + "display_name": "gpt-5", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 65536 + "context": 400000, + "output": 128000 }, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" - }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", + "cost": { + "input": 1.25, + "output": 10, + "cache_read": 0.13 + } + } + ] + }, + "anthropic": { + "id": "anthropic", + "name": "Anthropic", + "display_name": "Anthropic", + "doc": "https://docs.anthropic.com/en/docs/about-claude/models", + "models": [ { - "id": "deepseek-r1:latest", - "name": "DeepSeek-R1 Latest", - "display_name": "DeepSeek-R1 Latest", + "id": "claude-opus-4-0", + "name": "Claude Opus 4 (latest)", + "display_name": "Claude Opus 4 (latest)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 200000, + "output": 32000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", + "cost": { + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 + } }, { - "id": "deepseek-r1:1.5b", - "name": "DeepSeek-R1 1.5B", - "display_name": "DeepSeek-R1 1.5B", + "id": "claude-3-5-sonnet-20241022", + "name": "Claude Sonnet 3.5 v2", + "display_name": "Claude Sonnet 3.5 v2", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 200000, + "output": 8192 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2024-04-30", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", + "cost": { + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 + } }, { - "id": "deepseek-r1:7b", - "name": "DeepSeek-R1 7B", - "display_name": "DeepSeek-R1 7B", + "id": "claude-opus-4-1", + "name": "Claude Opus 4.1 (latest)", + "display_name": "Claude Opus 4.1 (latest)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 200000, + "output": 32000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "cost": { + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 + } }, { - "id": "deepseek-r1:8b", - "name": "DeepSeek-R1 8B", - "display_name": "DeepSeek-R1 8B", + "id": "claude-haiku-4-5", + "name": "Claude Haiku 4.5 (latest)", + "display_name": "Claude Haiku 4.5 (latest)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 200000, + "output": 64000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", + "cost": { + "input": 1, + "output": 5, + "cache_read": 0.1, + "cache_write": 1.25 + } }, { - "id": "deepseek-r1:14b", - "name": "DeepSeek-R1 14B", - "display_name": "DeepSeek-R1 14B", + "id": "claude-3-5-sonnet-20240620", + "name": "Claude Sonnet 3.5", + "display_name": "Claude Sonnet 3.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 200000, + "output": 8192 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2024-04-30", + "release_date": "2024-06-20", + "last_updated": "2024-06-20", + "cost": { + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 + } }, { - "id": "deepseek-r1:32b", - "name": "DeepSeek-R1 32B", - "display_name": "DeepSeek-R1 32B", + "id": "claude-opus-4-6", + "name": "Claude Opus 4.6", + "display_name": "Claude Opus 4.6", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 1000000, + "output": 128000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2025-05", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", + "cost": { + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25, + "context_over_200k": { + "input": 10, + "output": 37.5, + "cache_read": 1, + "cache_write": 12.5 + } + } }, { - "id": "deepseek-r1:70b", - "name": "DeepSeek-R1 70B", - "display_name": "DeepSeek-R1 70B", + "id": "claude-3-5-haiku-latest", + "name": "Claude Haiku 3.5 (latest)", + "display_name": "Claude Haiku 3.5 (latest)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 200000, + "output": 8192 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2024-07-31", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", + "cost": { + "input": 0.8, + "output": 4, + "cache_read": 0.08, + "cache_write": 1 + } }, { - "id": "deepseek-r1:671b", - "name": "DeepSeek-R1 671B", - "display_name": "DeepSeek-R1 671B", + "id": "claude-opus-4-5", + "name": "Claude Opus 4.5 (latest)", + "display_name": "Claude Opus 4.5 (latest)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 160000, - "output": 40000 + "context": 200000, + "output": 64000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-11-24", + "last_updated": "2025-11-24", + "cost": { + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 + } }, { - "id": "qwen3-coder:latest", - "name": "Qwen3-Coder Latest", - "display_name": "Qwen3-Coder Latest", + "id": "claude-3-opus-20240229", + "name": "Claude Opus 3", + "display_name": "Claude Opus 3", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 65536 + "context": 200000, + "output": 4096 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2023-08-31", + "release_date": "2024-02-29", + "last_updated": "2024-02-29", + "cost": { + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 + } }, { - "id": "qwen3-coder:30b", - "name": "Qwen3-Coder 30B", - "display_name": "Qwen3-Coder 30B", + "id": "claude-opus-4-5-20251101", + "name": "Claude Opus 4.5", + "display_name": "Claude Opus 4.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 65536 + "context": 200000, + "output": 64000 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-11-01", + "last_updated": "2025-11-01", + "cost": { + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 + } }, { - "id": "qwen3-coder:480b", - "name": "Qwen3-Coder 480B", - "display_name": "Qwen3-Coder 480B", + "id": "claude-sonnet-4-5", + "name": "Claude Sonnet 4.5 (latest)", + "display_name": "Claude Sonnet 4.5 (latest)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 65536 + "context": 200000, + "output": 64000 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", + "cost": { + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 + } }, { - "id": "qwen3-coder:480b-cloud", - "name": "Qwen3 Coder 480B", - "display_name": "Qwen3 Coder 480B", + "id": "claude-sonnet-4-5-20250929", + "name": "Claude Sonnet 4.5", + "display_name": "Claude Sonnet 4.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" @@ -62475,162 +60903,249 @@ }, "limit": { "context": 200000, - "output": 8192 + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-07-22", - "last_updated": "2025-07-22", - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", + "cost": { + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 + } }, { - "id": "gemma3:latest", - "name": "Gemma3 Latest", - "display_name": "Gemma3 Latest", + "id": "claude-sonnet-4-20250514", + "name": "Claude Sonnet 4", + "display_name": "Claude Sonnet 4", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 200000, + "output": 64000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", + "cost": { + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 + } }, { - "id": "gemma3:270m", - "name": "Gemma3 270M", - "display_name": "Gemma3 270M", + "id": "claude-opus-4-20250514", + "name": "Claude Opus 4", + "display_name": "Claude Opus 4", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 32000, - "output": 8192 + "context": 200000, + "output": 32000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", + "cost": { + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 + } }, { - "id": "gemma3:1b", - "name": "Gemma3 1B", - "display_name": "Gemma3 1B", + "id": "claude-3-5-haiku-20241022", + "name": "Claude Haiku 3.5", + "display_name": "Claude Haiku 3.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 32000, + "context": 200000, "output": 8192 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2024-07-31", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", + "cost": { + "input": 0.8, + "output": 4, + "cache_read": 0.08, + "cache_write": 1 + } }, { - "id": "gemma3:4b", - "name": "Gemma3 4B", - "display_name": "Gemma3 4B", + "id": "claude-3-haiku-20240307", + "name": "Claude Haiku 3", + "display_name": "Claude Haiku 3", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 200000, + "output": 4096 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2023-08-31", + "release_date": "2024-03-13", + "last_updated": "2024-03-13", + "cost": { + "input": 0.25, + "output": 1.25, + "cache_read": 0.03, + "cache_write": 0.3 + } }, { - "id": "gemma3:12b", - "name": "Gemma3 12B", - "display_name": "Gemma3 12B", + "id": "claude-3-7-sonnet-20250219", + "name": "Claude Sonnet 3.7", + "display_name": "Claude Sonnet 3.7", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 200000, + "output": 64000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2024-10-31", + "release_date": "2025-02-19", + "last_updated": "2025-02-19", + "cost": { + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 + } }, { - "id": "gemma3:27b", - "name": "Gemma3 27B", - "display_name": "Gemma3 27B", + "id": "claude-3-7-sonnet-latest", + "name": "Claude Sonnet 3.7 (latest)", + "display_name": "Claude Sonnet 3.7 (latest)", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 200000, + "output": 64000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2024-10-31", + "release_date": "2025-02-19", + "last_updated": "2025-02-19", + "cost": { + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 + } }, { - "id": "glm-4.6:cloud", - "name": "GLM-4.6", - "display_name": "GLM-4.6", + "id": "claude-sonnet-4-0", + "name": "Claude Sonnet 4 (latest)", + "display_name": "Claude Sonnet 4 (latest)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" @@ -62638,276 +61153,428 @@ }, "limit": { "context": 200000, - "output": 8192 + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-09-29", - "last_updated": "2025-09-29", - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", + "cost": { + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 + } }, { - "id": "qwen3:latest", - "name": "Qwen3 Latest", - "display_name": "Qwen3 Latest", + "id": "claude-opus-4-1-20250805", + "name": "Claude Opus 4.1", + "display_name": "Claude Opus 4.1", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 40000, - "output": 10000 + "context": 200000, + "output": 32000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "cost": { + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 + } }, { - "id": "qwen3:0.6b", - "name": "Qwen3 0.6B", - "display_name": "Qwen3 0.6B", + "id": "claude-3-sonnet-20240229", + "name": "Claude Sonnet 3", + "display_name": "Claude Sonnet 3", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 40000, - "output": 10000 + "context": 200000, + "output": 4096 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2023-08-31", + "release_date": "2024-03-04", + "last_updated": "2024-03-04", + "cost": { + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 0.3 + } }, { - "id": "qwen3:1.7b", - "name": "Qwen3 1.7B", - "display_name": "Qwen3 1.7B", + "id": "claude-haiku-4-5-20251001", + "name": "Claude Haiku 4.5", + "display_name": "Claude Haiku 4.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 40000, - "output": 10000 + "context": 200000, + "output": 64000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "type": "chat" - }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", + "cost": { + "input": 1, + "output": 5, + "cache_read": 0.1, + "cache_write": 1.25 + } + } + ] + }, + "gitlab": { + "id": "gitlab", + "name": "GitLab Duo", + "display_name": "GitLab Duo", + "doc": "https://docs.gitlab.com/user/duo_agent_platform/", + "models": [ { - "id": "qwen3:4b", - "name": "Qwen3 4B", - "display_name": "Qwen3 4B", + "id": "duo-chat-gpt-5-1", + "name": "Agentic Chat (GPT-5.1)", + "display_name": "Agentic Chat (GPT-5.1)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 65536 + "context": 400000, + "output": 128000 }, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2026-01-22", + "last_updated": "2026-01-22", + "cost": { + "input": 0, + "output": 0 + } }, { - "id": "qwen3:8b", - "name": "Qwen3 8B", - "display_name": "Qwen3 8B", + "id": "duo-chat-opus-4-5", + "name": "Agentic Chat (Claude Opus 4.5)", + "display_name": "Agentic Chat (Claude Opus 4.5)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 40000, - "output": 10000 + "context": 200000, + "output": 64000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2026-01-08", + "last_updated": "2026-01-08", + "cost": { + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 + } }, { - "id": "qwen3:14b", - "name": "Qwen3 14B", - "display_name": "Qwen3 14B", + "id": "duo-chat-sonnet-4-5", + "name": "Agentic Chat (Claude Sonnet 4.5)", + "display_name": "Agentic Chat (Claude Sonnet 4.5)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 40000, - "output": 10000 + "context": 200000, + "output": 64000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2025-07-31", + "release_date": "2026-01-08", + "last_updated": "2026-01-08", + "cost": { + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 + } }, { - "id": "qwen3:30b", - "name": "Qwen3 30B", - "display_name": "Qwen3 30B", + "id": "duo-chat-gpt-5-mini", + "name": "Agentic Chat (GPT-5 Mini)", + "display_name": "Agentic Chat (GPT-5 Mini)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 65536 + "context": 400000, + "output": 128000 }, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2024-05-30", + "release_date": "2026-01-22", + "last_updated": "2026-01-22", + "cost": { + "input": 0, + "output": 0 + } }, { - "id": "qwen3:32b", - "name": "Qwen3 32B", - "display_name": "Qwen3 32B", + "id": "duo-chat-gpt-5-2", + "name": "Agentic Chat (GPT-5.2)", + "display_name": "Agentic Chat (GPT-5.2)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 40000, - "output": 10000 + "context": 400000, + "output": 128000 }, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-01-23", + "last_updated": "2026-01-23", + "cost": { + "input": 0, + "output": 0 + } }, { - "id": "qwen3:235b", - "name": "Qwen3 235B", - "display_name": "Qwen3 235B", + "id": "duo-chat-gpt-5-2-codex", + "name": "Agentic Chat (GPT-5.2 Codex)", + "display_name": "Agentic Chat (GPT-5.2 Codex)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 65536 + "context": 400000, + "output": 128000 }, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-01-22", + "last_updated": "2026-01-22", + "cost": { + "input": 0, + "output": 0 + } }, { - "id": "deepseek-v3.1:latest", - "name": "DeepSeek-V3.1 Latest", - "display_name": "DeepSeek-V3.1 Latest", + "id": "duo-chat-gpt-5-codex", + "name": "Agentic Chat (GPT-5 Codex)", + "display_name": "Agentic Chat (GPT-5 Codex)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 160000, - "output": 40000 + "context": 400000, + "output": 128000 }, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "type": "chat" + "attachment": false, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2026-01-22", + "last_updated": "2026-01-22", + "cost": { + "input": 0, + "output": 0 + } }, { - "id": "deepseek-v3.1:671b", - "name": "DeepSeek-V3.1 671B", - "display_name": "DeepSeek-V3.1 671B", + "id": "duo-chat-haiku-4-5", + "name": "Agentic Chat (Claude Haiku 4.5)", + "display_name": "Agentic Chat (Claude Haiku 4.5)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 160000, - "output": 40000 + "context": 200000, + "output": 64000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "type": "chat" - }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-02-28", + "release_date": "2026-01-08", + "last_updated": "2026-01-08", + "cost": { + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 + } + } + ] + }, + "fireworks-ai": { + "id": "fireworks-ai", + "name": "Fireworks AI", + "display_name": "Fireworks AI", + "api": "https://api.fireworks.ai/inference/v1/", + "doc": "https://fireworks.ai/docs/", + "models": [ { - "id": "deepseek-v3.1:671b-cloud", - "name": "DeepSeek-V3.1 671B", - "display_name": "DeepSeek-V3.1 671B", + "id": "accounts/fireworks/models/deepseek-r1-0528", + "name": "Deepseek R1 05/28", + "display_name": "Deepseek R1 05/28", "modalities": { "input": [ "text" @@ -62918,7 +61585,7 @@ }, "limit": { "context": 160000, - "output": 8192 + "output": 16384 }, "temperature": true, "tool_call": true, @@ -62928,14 +61595,18 @@ }, "attachment": false, "open_weights": true, - "release_date": "2025-08-21", - "last_updated": "2025-08-21", - "type": "chat" + "knowledge": "2025-05", + "release_date": "2025-05-28", + "last_updated": "2025-05-28", + "cost": { + "input": 3, + "output": 8 + } }, { - "id": "llama3.1:latest", - "name": "Llama 3.1 Latest", - "display_name": "Llama 3.1 Latest", + "id": "accounts/fireworks/models/deepseek-v3p1", + "name": "DeepSeek V3.1", + "display_name": "DeepSeek V3.1", "modalities": { "input": [ "text" @@ -62945,19 +61616,29 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 163840, + "output": 163840 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" + "attachment": false, + "open_weights": true, + "knowledge": "2025-07", + "release_date": "2025-08-21", + "last_updated": "2025-08-21", + "cost": { + "input": 0.56, + "output": 1.68 + } }, { - "id": "llama3.1:8b", - "name": "Llama 3.1 8B", - "display_name": "Llama 3.1 8B", + "id": "accounts/fireworks/models/deepseek-v3p2", + "name": "DeepSeek V3.2", + "display_name": "DeepSeek V3.2", "modalities": { "input": [ "text" @@ -62967,21 +61648,32 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 160000, + "output": 160000 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" - }, - { - "id": "llama3.1:70b", - "name": "Llama 3.1 70B", - "display_name": "Llama 3.1 70B", - "modalities": { - "input": [ + "attachment": false, + "open_weights": true, + "knowledge": "2025-09", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", + "cost": { + "input": 0.56, + "output": 1.68, + "cache_read": 0.28 + } + }, + { + "id": "accounts/fireworks/models/minimax-m2", + "name": "MiniMax-M2", + "display_name": "MiniMax-M2", + "modalities": { + "input": [ "text" ], "output": [ @@ -62989,19 +61681,30 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 192000, + "output": 192000 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" + "attachment": false, + "open_weights": true, + "knowledge": "2024-11", + "release_date": "2025-10-27", + "last_updated": "2025-10-27", + "cost": { + "input": 0.3, + "output": 1.2, + "cache_read": 0.15 + } }, { - "id": "llama3.1:405b", - "name": "Llama 3.1 405B", - "display_name": "Llama 3.1 405B", + "id": "accounts/fireworks/models/minimax-m2p1", + "name": "MiniMax-M2.1", + "display_name": "MiniMax-M2.1", "modalities": { "input": [ "text" @@ -63011,19 +61714,29 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 200000, + "output": 200000 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" + "attachment": false, + "open_weights": true, + "release_date": "2025-12-23", + "last_updated": "2025-12-23", + "cost": { + "input": 0.3, + "output": 1.2, + "cache_read": 0.15 + } }, { - "id": "llama3.2:latest", - "name": "Llama 3.2 Latest", - "display_name": "Llama 3.2 Latest", + "id": "accounts/fireworks/models/glm-4p7", + "name": "GLM 4.7", + "display_name": "GLM 4.7", "modalities": { "input": [ "text" @@ -63033,19 +61746,30 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 198000, + "output": 198000 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", + "cost": { + "input": 0.6, + "output": 2.2, + "cache_read": 0.3 + } }, { - "id": "llama3.2:1b", - "name": "Llama 3.2 1B", - "display_name": "Llama 3.2 1B", + "id": "accounts/fireworks/models/deepseek-v3-0324", + "name": "Deepseek V3 03-24", + "display_name": "Deepseek V3 03-24", "modalities": { "input": [ "text" @@ -63055,19 +61779,28 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 160000, + "output": 16384 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "type": "chat" + "attachment": false, + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2025-03-24", + "last_updated": "2025-03-24", + "cost": { + "input": 0.9, + "output": 0.9 + } }, { - "id": "llama3.2:3b", - "name": "Llama 3.2 3B", - "display_name": "Llama 3.2 3B", + "id": "accounts/fireworks/models/glm-4p6", + "name": "GLM 4.6", + "display_name": "GLM 4.6", "modalities": { "input": [ "text" @@ -63077,19 +61810,30 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 198000, + "output": 198000 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-10-01", + "last_updated": "2025-10-01", + "cost": { + "input": 0.55, + "output": 2.19, + "cache_read": 0.28 + } }, { - "id": "phi3:latest", - "name": "Phi-3 Latest", - "display_name": "Phi-3 Latest", + "id": "accounts/fireworks/models/kimi-k2-thinking", + "name": "Kimi K2 Thinking", + "display_name": "Kimi K2 Thinking", "modalities": { "input": [ "text" @@ -63099,19 +61843,29 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 256000, + "output": 256000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" + "attachment": false, + "open_weights": true, + "release_date": "2025-11-06", + "last_updated": "2025-11-06", + "cost": { + "input": 0.6, + "output": 2.5, + "cache_read": 0.3 + } }, { - "id": "phi3:3.8b", - "name": "Phi-3 3.8B", - "display_name": "Phi-3 3.8B", + "id": "accounts/fireworks/models/kimi-k2-instruct", + "name": "Kimi K2 Instruct", + "display_name": "Kimi K2 Instruct", "modalities": { "input": [ "text" @@ -63122,40 +61876,62 @@ }, "limit": { "context": 128000, - "output": 32768 + "output": 16384 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "type": "chat" + "attachment": false, + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2025-07-11", + "last_updated": "2025-07-11", + "cost": { + "input": 1, + "output": 3 + } }, { - "id": "phi3:14b", - "name": "Phi-3 14B", - "display_name": "Phi-3 14B", + "id": "accounts/fireworks/models/kimi-k2p5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 256000, + "output": 256000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" + "attachment": false, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-01-27", + "last_updated": "2026-01-27", + "cost": { + "input": 0.6, + "output": 3, + "cache_read": 0.1 + } }, { - "id": "mistral-nemo:latest", - "name": "Mistral-Nemo Latest", - "display_name": "Mistral-Nemo Latest", + "id": "accounts/fireworks/models/qwen3-235b-a22b", + "name": "Qwen3 235B-A22B", + "display_name": "Qwen3 235B-A22B", "modalities": { "input": [ "text" @@ -63165,19 +61941,29 @@ ] }, "limit": { - "context": 1000000, - "output": 250000 + "context": 128000, + "output": 16384 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-04-29", + "last_updated": "2025-04-29", + "cost": { + "input": 0.22, + "output": 0.88 + } }, { - "id": "mistral-nemo:12b", - "name": "Mistral-Nemo 12B", - "display_name": "Mistral-Nemo 12B", + "id": "accounts/fireworks/models/gpt-oss-20b", + "name": "GPT OSS 20B", + "display_name": "GPT OSS 20B", "modalities": { "input": [ "text" @@ -63187,88 +61973,121 @@ ] }, "limit": { - "context": 1000000, - "output": 250000 + "context": 131072, + "output": 32768 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" + "attachment": false, + "open_weights": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "cost": { + "input": 0.05, + "output": 0.2 + } }, { - "id": "llava:latest", - "name": "LLaVA Latest", - "display_name": "LLaVA Latest", + "id": "accounts/fireworks/models/gpt-oss-120b", + "name": "GPT OSS 120B", + "display_name": "GPT OSS 120B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 32000, - "output": 8192 + "context": 131072, + "output": 32768 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" + "attachment": false, + "open_weights": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "cost": { + "input": 0.15, + "output": 0.6 + } }, { - "id": "llava:7b", - "name": "LLaVA 7B", - "display_name": "LLaVA 7B", + "id": "accounts/fireworks/models/glm-4p5-air", + "name": "GLM 4.5 Air", + "display_name": "GLM 4.5 Air", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 32000, - "output": 8192 + "context": 131072, + "output": 131072 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-08-01", + "last_updated": "2025-08-01", + "cost": { + "input": 0.22, + "output": 0.88 + } }, { - "id": "llava:13b", - "name": "LLaVA 13B", - "display_name": "LLaVA 13B", + "id": "accounts/fireworks/models/qwen3-coder-480b-a35b-instruct", + "name": "Qwen3 Coder 480B A35B Instruct", + "display_name": "Qwen3 Coder 480B A35B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 4000, - "output": 1000 + "context": 256000, + "output": 32768 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "type": "chat" + "attachment": false, + "open_weights": true, + "release_date": "2025-07-22", + "last_updated": "2025-07-22", + "cost": { + "input": 0.45, + "output": 1.8 + } }, { - "id": "llava:34b", - "name": "LLaVA 34B", - "display_name": "LLaVA 34B", + "id": "accounts/fireworks/models/glm-4p5", + "name": "GLM 4.5", + "display_name": "GLM 4.5", "modalities": { "input": [ "text" @@ -63278,19 +62097,38 @@ ] }, "limit": { - "context": 4000, - "output": 1000 + "context": 131072, + "output": 131072 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" - }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-29", + "last_updated": "2025-07-29", + "cost": { + "input": 0.55, + "output": 2.19 + } + } + ] + }, + "io-net": { + "id": "io-net", + "name": "IO.NET", + "display_name": "IO.NET", + "api": "https://api.intelligence.io.solutions/api/v1", + "doc": "https://io.net/docs/guides/intelligence/io-intelligence", + "models": [ { - "id": "codellama:latest", - "name": "CodeLlama Latest", - "display_name": "CodeLlama Latest", + "id": "moonshotai/Kimi-K2-Instruct-0905", + "name": "Kimi K2 Instruct", + "display_name": "Kimi K2 Instruct", "modalities": { "input": [ "text" @@ -63300,19 +62138,30 @@ ] }, "limit": { - "context": 16000, - "output": 4000 + "context": 32768, + "output": 4096 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "type": "chat" + "attachment": false, + "open_weights": false, + "knowledge": "2024-08", + "release_date": "2024-09-05", + "last_updated": "2024-09-05", + "cost": { + "input": 0.39, + "output": 1.9, + "cache_read": 0.195, + "cache_write": 0.78 + } }, { - "id": "codellama:7b", - "name": "CodeLlama 7B", - "display_name": "CodeLlama 7B", + "id": "moonshotai/Kimi-K2-Thinking", + "name": "Kimi K2 Thinking", + "display_name": "Kimi K2 Thinking", "modalities": { "input": [ "text" @@ -63322,19 +62171,31 @@ ] }, "limit": { - "context": 16000, - "output": 4000 + "context": 32768, + "output": 4096 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" + "attachment": false, + "open_weights": false, + "knowledge": "2024-08", + "release_date": "2024-11-01", + "last_updated": "2024-11-01", + "cost": { + "input": 0.55, + "output": 2.25, + "cache_read": 0.275, + "cache_write": 1.1 + } }, { - "id": "codellama:13b", - "name": "CodeLlama 13B", - "display_name": "CodeLlama 13B", + "id": "openai/gpt-oss-20b", + "name": "GPT-OSS 20B", + "display_name": "GPT-OSS 20B", "modalities": { "input": [ "text" @@ -63344,19 +62205,30 @@ ] }, "limit": { - "context": 16000, - "output": 4000 + "context": 64000, + "output": 4096 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "type": "chat" + "attachment": false, + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2024-12-01", + "last_updated": "2024-12-01", + "cost": { + "input": 0.03, + "output": 0.14, + "cache_read": 0.015, + "cache_write": 0.06 + } }, { - "id": "codellama:34b", - "name": "CodeLlama 34B", - "display_name": "CodeLlama 34B", + "id": "openai/gpt-oss-120b", + "name": "GPT-OSS 120B", + "display_name": "GPT-OSS 120B", "modalities": { "input": [ "text" @@ -63366,19 +62238,30 @@ ] }, "limit": { - "context": 16000, - "output": 4000 + "context": 131072, + "output": 4096 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "type": "chat" + "attachment": false, + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2024-12-01", + "last_updated": "2024-12-01", + "cost": { + "input": 0.04, + "output": 0.4, + "cache_read": 0.02, + "cache_write": 0.08 + } }, { - "id": "codellama:70b", - "name": "CodeLlama 70B", - "display_name": "CodeLlama 70B", + "id": "mistralai/Devstral-Small-2505", + "name": "Devstral Small 2505", + "display_name": "Devstral Small 2505", "modalities": { "input": [ "text" @@ -63388,19 +62271,30 @@ ] }, "limit": { - "context": 2000, - "output": 500 + "context": 128000, + "output": 4096 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "type": "chat" + "attachment": false, + "open_weights": false, + "knowledge": "2024-12", + "release_date": "2025-05-01", + "last_updated": "2025-05-01", + "cost": { + "input": 0.05, + "output": 0.22, + "cache_read": 0.025, + "cache_write": 0.1 + } }, { - "id": "mixtral:latest", - "name": "Mixtral Latest", - "display_name": "Mixtral Latest", + "id": "mistralai/Mistral-Nemo-Instruct-2407", + "name": "Mistral Nemo Instruct 2407", + "display_name": "Mistral Nemo Instruct 2407", "modalities": { "input": [ "text" @@ -63410,41 +62304,30 @@ ] }, "limit": { - "context": 32000, - "output": 8192 + "context": 128000, + "output": 4096 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "type": "chat" - }, - { - "id": "mixtral:8x7b", - "name": "Mixtral 8x7B", - "display_name": "Mixtral 8x7B", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 32000, - "output": 8192 - }, - "tool_call": true, - "reasoning": { - "supported": false - }, - "type": "chat" + "attachment": false, + "open_weights": true, + "knowledge": "2024-05", + "release_date": "2024-07-01", + "last_updated": "2024-07-01", + "cost": { + "input": 0.02, + "output": 0.04, + "cache_read": 0.01, + "cache_write": 0.04 + } }, { - "id": "mixtral:8x22b", - "name": "Mixtral 8x22B", - "display_name": "Mixtral 8x22B", + "id": "mistralai/Magistral-Small-2506", + "name": "Magistral Small 2506", + "display_name": "Magistral Small 2506", "modalities": { "input": [ "text" @@ -63454,41 +62337,64 @@ ] }, "limit": { - "context": 64000, - "output": 16000 + "context": 128000, + "output": 4096 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "type": "chat" + "attachment": false, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-06-01", + "last_updated": "2025-06-01", + "cost": { + "input": 0.5, + "output": 1.5, + "cache_read": 0.25, + "cache_write": 1 + } }, { - "id": "deepseek-coder:latest", - "name": "DeepSeek-Coder Latest", - "display_name": "DeepSeek-Coder Latest", + "id": "mistralai/Mistral-Large-Instruct-2411", + "name": "Mistral Large Instruct 2411", + "display_name": "Mistral Large Instruct 2411", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 16000, - "output": 4000 + "context": 128000, + "output": 4096 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "type": "chat" + "attachment": false, + "open_weights": false, + "knowledge": "2024-10", + "release_date": "2024-11-01", + "last_updated": "2024-11-01", + "cost": { + "input": 2, + "output": 6, + "cache_read": 1, + "cache_write": 4 + } }, { - "id": "deepseek-coder:1.3b", - "name": "DeepSeek-Coder 1.3B", - "display_name": "DeepSeek-Coder 1.3B", + "id": "meta-llama/Llama-3.3-70B-Instruct", + "name": "Llama 3.3 70B Instruct", + "display_name": "Llama 3.3 70B Instruct", "modalities": { "input": [ "text" @@ -63498,44 +62404,68 @@ ] }, "limit": { - "context": 16000, - "output": 4000 + "context": 128000, + "output": 4096 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "type": "chat" + "attachment": false, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", + "cost": { + "input": 0.13, + "output": 0.38, + "cache_read": 0.065, + "cache_write": 0.26 + } }, { - "id": "deepseek-coder:6.7b", - "name": "DeepSeek-Coder 6.7B", - "display_name": "DeepSeek-Coder 6.7B", + "id": "meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8", + "name": "Llama 4 Maverick 17B 128E Instruct", + "display_name": "Llama 4 Maverick 17B 128E Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 16000, - "output": 4000 + "context": 430000, + "output": 4096 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "type": "chat" + "attachment": false, + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2025-01-15", + "last_updated": "2025-01-15", + "cost": { + "input": 0.15, + "output": 0.6, + "cache_read": 0.075, + "cache_write": 0.3 + } }, { - "id": "deepseek-coder:33b", - "name": "DeepSeek-Coder 33B", - "display_name": "DeepSeek-Coder 33B", + "id": "meta-llama/Llama-3.2-90B-Vision-Instruct", + "name": "Llama 3.2 90B Vision Instruct", + "display_name": "Llama 3.2 90B Vision Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -63543,41 +62473,62 @@ }, "limit": { "context": 16000, - "output": 4000 + "output": 4096 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "type": "chat" + "attachment": false, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-09-25", + "last_updated": "2024-09-25", + "cost": { + "input": 0.35, + "output": 0.4, + "cache_read": 0.175, + "cache_write": 0.7 + } }, { - "id": "qwen2.5vl:latest", - "name": "Qwen2.5-VL Latest", - "display_name": "Qwen2.5-VL Latest", + "id": "Intel/Qwen3-Coder-480B-A35B-Instruct-int4-mixed-ar", + "name": "Qwen 3 Coder 480B", + "display_name": "Qwen 3 Coder 480B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 125000, - "output": 31250 + "context": 106000, + "output": 4096 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "type": "chat" + "attachment": false, + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2025-01-15", + "last_updated": "2025-01-15", + "cost": { + "input": 0.22, + "output": 0.95, + "cache_read": 0.11, + "cache_write": 0.44 + } }, { - "id": "qwen2.5vl:3b", - "name": "Qwen2.5-VL 3B", - "display_name": "Qwen2.5-VL 3B", + "id": "Qwen/Qwen2.5-VL-32B-Instruct", + "name": "Qwen 2.5 VL 32B Instruct", + "display_name": "Qwen 2.5 VL 32B Instruct", "modalities": { "input": [ "text", @@ -63588,88 +62539,130 @@ ] }, "limit": { - "context": 125000, - "output": 31250 + "context": 32000, + "output": 4096 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "type": "chat" + "attachment": false, + "open_weights": true, + "knowledge": "2024-09", + "release_date": "2024-11-01", + "last_updated": "2024-11-01", + "cost": { + "input": 0.05, + "output": 0.22, + "cache_read": 0.025, + "cache_write": 0.1 + } }, { - "id": "qwen2.5vl:7b", - "name": "Qwen2.5-VL 7B", - "display_name": "Qwen2.5-VL 7B", + "id": "Qwen/Qwen3-235B-A22B-Thinking-2507", + "name": "Qwen 3 235B Thinking", + "display_name": "Qwen 3 235B Thinking", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 125000, - "output": 31250 + "context": 262144, + "output": 4096 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" + "attachment": false, + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2025-07-01", + "last_updated": "2025-07-01", + "cost": { + "input": 0.11, + "output": 0.6, + "cache_read": 0.055, + "cache_write": 0.22 + } }, { - "id": "qwen2.5vl:32b", - "name": "Qwen2.5-VL 32B", - "display_name": "Qwen2.5-VL 32B", + "id": "Qwen/Qwen3-Next-80B-A3B-Instruct", + "name": "Qwen 3 Next 80B Instruct", + "display_name": "Qwen 3 Next 80B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 125000, - "output": 31250 + "context": 262144, + "output": 4096 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "type": "chat" + "attachment": false, + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2025-01-10", + "last_updated": "2025-01-10", + "cost": { + "input": 0.1, + "output": 0.8, + "cache_read": 0.05, + "cache_write": 0.2 + } }, { - "id": "qwen2.5vl:72b", - "name": "Qwen2.5-VL 72B", - "display_name": "Qwen2.5-VL 72B", + "id": "zai-org/GLM-4.6", + "name": "GLM 4.6", + "display_name": "GLM 4.6", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 125000, - "output": 31250 + "context": 200000, + "output": 4096 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "type": "chat" + "attachment": false, + "open_weights": false, + "knowledge": "2024-10", + "release_date": "2024-11-15", + "last_updated": "2024-11-15", + "cost": { + "input": 0.4, + "output": 1.75, + "cache_read": 0.2, + "cache_write": 0.8 + } }, { - "id": "nomic-embed-text:latest", - "name": "Nomic-Embed-Text Latest", - "display_name": "Nomic-Embed-Text Latest", + "id": "deepseek-ai/DeepSeek-R1-0528", + "name": "DeepSeek R1", + "display_name": "DeepSeek R1", "modalities": { "input": [ "text" @@ -63679,19 +62672,40 @@ ] }, "limit": { - "context": 2000, - "output": 0 + "context": 128000, + "output": 4096 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "embedding" - }, + "attachment": false, + "open_weights": true, + "knowledge": "2024-07", + "release_date": "2025-01-20", + "last_updated": "2025-05-28", + "cost": { + "input": 2, + "output": 8.75, + "cache_read": 1, + "cache_write": 4 + } + } + ] + }, + "modelscope": { + "id": "modelscope", + "name": "ModelScope", + "display_name": "ModelScope", + "api": "https://api-inference.modelscope.cn/v1", + "doc": "https://modelscope.cn/docs/model-service/API-Inference/intro", + "models": [ { - "id": "nomic-embed-text:v1.5", - "name": "Nomic-Embed-Text v1.5", - "display_name": "Nomic-Embed-Text v1.5", + "id": "ZhipuAI/GLM-4.5", + "name": "GLM-4.5", + "display_name": "GLM-4.5", "modalities": { "input": [ "text" @@ -63701,19 +62715,29 @@ ] }, "limit": { - "context": 2000, - "output": 0 + "context": 131072, + "output": 98304 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "embedding" + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", + "cost": { + "input": 0, + "output": 0 + } }, { - "id": "nomic-embed-text:137m-v1.5-fp16", - "name": "Nomic-Embed-Text 137M v1.5 FP16", - "display_name": "Nomic-Embed-Text 137M v1.5 FP16", + "id": "ZhipuAI/GLM-4.6", + "name": "GLM-4.6", + "display_name": "GLM-4.6", "modalities": { "input": [ "text" @@ -63723,19 +62747,29 @@ ] }, "limit": { - "context": 2000, - "output": 0 + "context": 202752, + "output": 98304 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "embedding" + "attachment": false, + "open_weights": true, + "knowledge": "2025-07", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", + "cost": { + "input": 0, + "output": 0 + } }, { - "id": "qwq:latest", - "name": "QwQ Latest", - "display_name": "QwQ Latest", + "id": "Qwen/Qwen3-30B-A3B-Thinking-2507", + "name": "Qwen3 30B A3B Thinking 2507", + "display_name": "Qwen3 30B A3B Thinking 2507", "modalities": { "input": [ "text" @@ -63745,20 +62779,29 @@ ] }, "limit": { - "context": 40000, - "output": 10000 + "context": 262144, + "output": 32768 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "type": "chat" + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-30", + "last_updated": "2025-07-30", + "cost": { + "input": 0, + "output": 0 + } }, { - "id": "qwq:32b", - "name": "QwQ 32B", - "display_name": "QwQ 32B", + "id": "Qwen/Qwen3-235B-A22B-Instruct-2507", + "name": "Qwen3 235B A22B Instruct 2507", + "display_name": "Qwen3 235B A22B Instruct 2507", "modalities": { "input": [ "text" @@ -63768,20 +62811,28 @@ ] }, "limit": { - "context": 40000, - "output": 10000 + "context": 262144, + "output": 131072 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "type": "chat" + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-04-28", + "last_updated": "2025-07-21", + "cost": { + "input": 0, + "output": 0 + } }, { - "id": "mistral:latest", - "name": "Mistral Latest", - "display_name": "Mistral Latest", + "id": "Qwen/Qwen3-Coder-30B-A3B-Instruct", + "name": "Qwen3 Coder 30B A3B Instruct", + "display_name": "Qwen3 Coder 30B A3B Instruct", "modalities": { "input": [ "text" @@ -63791,19 +62842,28 @@ ] }, "limit": { - "context": 32000, - "output": 8192 + "context": 262144, + "output": 65536 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "type": "chat" + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-31", + "last_updated": "2025-07-31", + "cost": { + "input": 0, + "output": 0 + } }, { - "id": "mistral:7b", - "name": "Mistral 7B", - "display_name": "Mistral 7B", + "id": "Qwen/Qwen3-30B-A3B-Instruct-2507", + "name": "Qwen3 30B A3B Instruct 2507", + "display_name": "Qwen3 30B A3B Instruct 2507", "modalities": { "input": [ "text" @@ -63813,19 +62873,28 @@ ] }, "limit": { - "context": 32000, - "output": 8192 + "context": 262144, + "output": 16384 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "type": "chat" + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-30", + "last_updated": "2025-07-30", + "cost": { + "input": 0, + "output": 0 + } }, { - "id": "mistral-large-3:675b-cloud", - "name": "Mistral Large 3 675B Cloud", - "display_name": "Mistral Large 3 675B Cloud", + "id": "Qwen/Qwen3-235B-A22B-Thinking-2507", + "name": "Qwen3-235B-A22B-Thinking-2507", + "display_name": "Qwen3-235B-A22B-Thinking-2507", "modalities": { "input": [ "text" @@ -63835,42 +62904,68 @@ ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 262144, + "output": 131072 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" - }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-25", + "last_updated": "2025-07-25", + "cost": { + "input": 0, + "output": 0 + } + } + ] + }, + "azure-cognitive-services": { + "id": "azure-cognitive-services", + "name": "Azure Cognitive Services", + "display_name": "Azure Cognitive Services", + "doc": "https://learn.microsoft.com/en-us/azure/ai-services/openai/concepts/models", + "models": [ { - "id": "ministral-3:latest", - "name": "Ministral 3 Latest", - "display_name": "Ministral 3 Latest", + "id": "gpt-3.5-turbo-1106", + "name": "GPT-3.5 Turbo 1106", + "display_name": "GPT-3.5 Turbo 1106", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 16384, + "output": 16384 }, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { "supported": false }, - "type": "chat" + "attachment": false, + "open_weights": false, + "knowledge": "2021-08", + "release_date": "2023-11-06", + "last_updated": "2023-11-06", + "cost": { + "input": 1, + "output": 2 + } }, { - "id": "ministral-3:3b", - "name": "Ministral 3 3B", - "display_name": "Ministral 3 3B", + "id": "mistral-small-2503", + "name": "Mistral Small 3.1", + "display_name": "Mistral Small 3.1", "modalities": { "input": [ "text", @@ -63881,23 +62976,31 @@ ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 128000, + "output": 32768 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2024-09", + "release_date": "2025-03-01", + "last_updated": "2025-03-01", + "cost": { + "input": 0.1, + "output": 0.3 + } }, { - "id": "ministral-3:8b", - "name": "Ministral 3 8B", - "display_name": "Ministral 3 8B", + "id": "codestral-2501", + "name": "Codestral 25.01", + "display_name": "Codestral 25.01", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -63907,61 +63010,89 @@ "context": 256000, "output": 256000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "type": "chat" + "attachment": false, + "open_weights": false, + "knowledge": "2024-03", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", + "cost": { + "input": 0.3, + "output": 0.9 + } }, { - "id": "ministral-3:14b", - "name": "Ministral 3 14B", - "display_name": "Ministral 3 14B", + "id": "mistral-large-2411", + "name": "Mistral Large 24.11", + "display_name": "Mistral Large 24.11", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 128000, + "output": 32768 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "type": "chat" + "attachment": false, + "open_weights": false, + "knowledge": "2024-09", + "release_date": "2024-11-01", + "last_updated": "2024-11-01", + "cost": { + "input": 2, + "output": 6 + } }, { - "id": "ministral-3:3b-cloud", - "name": "Ministral 3 3B Cloud", - "display_name": "Ministral 3 3B Cloud", + "id": "gpt-5-pro", + "name": "GPT-5 Pro", + "display_name": "GPT-5 Pro", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 400000, + "output": 272000 }, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-10-06", + "last_updated": "2025-10-06", + "cost": { + "input": 15, + "output": 120 + } }, { - "id": "ministral-3:8b-cloud", - "name": "Ministral 3 8B Cloud", - "display_name": "Ministral 3 8B Cloud", + "id": "deepseek-v3.2", + "name": "DeepSeek-V3.2", + "display_name": "DeepSeek-V3.2", "modalities": { "input": [ "text" @@ -63971,19 +63102,29 @@ ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 128000, + "output": 128000 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" + "attachment": false, + "open_weights": true, + "knowledge": "2024-07", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", + "cost": { + "input": 0.58, + "output": 1.68 + } }, { - "id": "ministral-3:14b-cloud", - "name": "Ministral 3 14B Cloud", - "display_name": "Ministral 3 14B Cloud", + "id": "mai-ds-r1", + "name": "MAI-DS-R1", + "display_name": "MAI-DS-R1", "modalities": { "input": [ "text" @@ -63993,19 +63134,29 @@ ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 128000, + "output": 8192 }, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" + "attachment": false, + "open_weights": false, + "knowledge": "2024-06", + "release_date": "2025-01-20", + "last_updated": "2025-01-20", + "cost": { + "input": 1.35, + "output": 5.4 + } }, { - "id": "ministral-3:3b-instruct-2512-q4_K_M", - "name": "Ministral 3 3B Instruct 2512 Q4_K_M", - "display_name": "Ministral 3 3B Instruct 2512 Q4_K_M", + "id": "gpt-5", + "name": "GPT-5", + "display_name": "GPT-5", "modalities": { "input": [ "text", @@ -64016,19 +63167,30 @@ ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 272000, + "output": 128000 }, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", + "cost": { + "input": 1.25, + "output": 10, + "cache_read": 0.13 + } }, { - "id": "ministral-3:3b-instruct-2512-q8_0", - "name": "Ministral 3 3B Instruct 2512 Q8_0", - "display_name": "Ministral 3 3B Instruct 2512 Q8_0", + "id": "gpt-4o-mini", + "name": "GPT-4o mini", + "display_name": "GPT-4o mini", "modalities": { "input": [ "text", @@ -64039,42 +63201,61 @@ ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 128000, + "output": 16384 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2023-09", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", + "cost": { + "input": 0.15, + "output": 0.6, + "cache_read": 0.08 + } }, { - "id": "ministral-3:3b-instruct-2512-fp16", - "name": "Ministral 3 3B Instruct 2512 FP16", - "display_name": "Ministral 3 3B Instruct 2512 FP16", + "id": "phi-4-reasoning-plus", + "name": "Phi-4-reasoning-plus", + "display_name": "Phi-4-reasoning-plus", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 32000, + "output": 4096 }, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" + "attachment": false, + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", + "cost": { + "input": 0.125, + "output": 0.5 + } }, { - "id": "ministral-3:8b-instruct-2512-q4_K_M", - "name": "Ministral 3 8B Instruct 2512 Q4_K_M", - "display_name": "Ministral 3 8B Instruct 2512 Q4_K_M", + "id": "gpt-4-turbo-vision", + "name": "GPT-4 Turbo Vision", + "display_name": "GPT-4 Turbo Vision", "modalities": { "input": [ "text", @@ -64085,88 +63266,124 @@ ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 128000, + "output": 4096 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2023-11", + "release_date": "2023-11-06", + "last_updated": "2024-04-09", + "cost": { + "input": 10, + "output": 30 + } }, { - "id": "ministral-3:8b-instruct-2512-q8_0", - "name": "Ministral 3 8B Instruct 2512 Q8_0", - "display_name": "Ministral 3 8B Instruct 2512 Q8_0", + "id": "phi-4-reasoning", + "name": "Phi-4-reasoning", + "display_name": "Phi-4-reasoning", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 32000, + "output": 4096 }, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" + "attachment": false, + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", + "cost": { + "input": 0.125, + "output": 0.5 + } }, { - "id": "ministral-3:8b-instruct-2512-fp16", - "name": "Ministral 3 8B Instruct 2512 FP16", - "display_name": "Ministral 3 8B Instruct 2512 FP16", + "id": "phi-3-medium-4k-instruct", + "name": "Phi-3-medium-instruct (4k)", + "display_name": "Phi-3-medium-instruct (4k)", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 4096, + "output": 1024 }, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { "supported": false }, - "type": "chat" + "attachment": false, + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", + "cost": { + "input": 0.17, + "output": 0.68 + } }, { - "id": "ministral-3:14b-instruct-2512-q4_K_M", - "name": "Ministral 3 14B Instruct 2512 Q4_K_M", - "display_name": "Ministral 3 14B Instruct 2512 Q4_K_M", + "id": "codex-mini", + "name": "Codex Mini", + "display_name": "Codex Mini", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 200000, + "output": 100000 }, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-05-16", + "last_updated": "2025-05-16", + "cost": { + "input": 1.5, + "output": 6, + "cache_read": 0.375 + } }, { - "id": "ministral-3:14b-instruct-2512-q8_0", - "name": "Ministral 3 14B Instruct 2512 Q8_0", - "display_name": "Ministral 3 14B Instruct 2512 Q8_0", + "id": "o3", + "name": "o3", + "display_name": "o3", "modalities": { "input": [ "text", @@ -64177,42 +63394,61 @@ ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 200000, + "output": 100000 }, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2024-05", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", + "cost": { + "input": 2, + "output": 8, + "cache_read": 0.5 + } }, { - "id": "ministral-3:14b-instruct-2512-fp16", - "name": "Ministral 3 14B Instruct 2512 FP16", - "display_name": "Ministral 3 14B Instruct 2512 FP16", + "id": "mistral-nemo", + "name": "Mistral Nemo", + "display_name": "Mistral Nemo", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 128000, + "output": 128000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "type": "chat" + "attachment": false, + "open_weights": true, + "knowledge": "2024-07", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", + "cost": { + "input": 0.15, + "output": 0.15 + } }, { - "id": "qwen2.5:latest", - "name": "Qwen2.5 Latest", - "display_name": "Qwen2.5 Latest", + "id": "gpt-3.5-turbo-instruct", + "name": "GPT-3.5 Turbo Instruct", + "display_name": "GPT-3.5 Turbo Instruct", "modalities": { "input": [ "text" @@ -64222,19 +63458,28 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 4096, + "output": 4096 }, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { "supported": false }, - "type": "chat" + "attachment": false, + "open_weights": false, + "knowledge": "2021-08", + "release_date": "2023-09-21", + "last_updated": "2023-09-21", + "cost": { + "input": 1.5, + "output": 2 + } }, { - "id": "qwen2.5:0.5b", - "name": "Qwen2.5 0.5B", - "display_name": "Qwen2.5 0.5B", + "id": "meta-llama-3.1-8b-instruct", + "name": "Meta-Llama-3.1-8B-Instruct", + "display_name": "Meta-Llama-3.1-8B-Instruct", "modalities": { "input": [ "text" @@ -64247,16 +63492,25 @@ "context": 128000, "output": 32768 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "type": "chat" + "attachment": false, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", + "cost": { + "input": 0.3, + "output": 0.61 + } }, { - "id": "qwen2.5:1.5b", - "name": "Qwen2.5 1.5B", - "display_name": "Qwen2.5 1.5B", + "id": "text-embedding-ada-002", + "name": "text-embedding-ada-002", + "display_name": "text-embedding-ada-002", "modalities": { "input": [ "text" @@ -64266,19 +63520,26 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 8192, + "output": 1536 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "type": "chat" + "attachment": false, + "open_weights": false, + "release_date": "2022-12-15", + "last_updated": "2022-12-15", + "cost": { + "input": 0.1, + "output": 0 + } }, { - "id": "qwen2.5:3b", - "name": "Qwen2.5 3B", - "display_name": "Qwen2.5 3B", + "id": "cohere-embed-v3-english", + "name": "Embed v3 English", + "display_name": "Embed v3 English", "modalities": { "input": [ "text" @@ -64288,22 +63549,31 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 512, + "output": 1024 }, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, - "type": "chat" + "attachment": false, + "open_weights": true, + "release_date": "2023-11-07", + "last_updated": "2023-11-07", + "cost": { + "input": 0.1, + "output": 0 + } }, { - "id": "qwen2.5:7b", - "name": "Qwen2.5 7B", - "display_name": "Qwen2.5 7B", + "id": "llama-4-scout-17b-16e-instruct", + "name": "Llama 4 Scout 17B 16E Instruct", + "display_name": "Llama 4 Scout 17B 16E Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -64311,18 +63581,27 @@ }, "limit": { "context": 128000, - "output": 32768 + "output": 8192 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "type": "chat" + "attachment": true, + "open_weights": true, + "knowledge": "2024-08", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", + "cost": { + "input": 0.2, + "output": 0.78 + } }, { - "id": "qwen2.5:14b", - "name": "Qwen2.5 14B", - "display_name": "Qwen2.5 14B", + "id": "o1-mini", + "name": "o1-mini", + "display_name": "o1-mini", "modalities": { "input": [ "text" @@ -64333,40 +63612,63 @@ }, "limit": { "context": 128000, - "output": 32768 + "output": 65536 }, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" + "attachment": false, + "open_weights": false, + "knowledge": "2023-09", + "release_date": "2024-09-12", + "last_updated": "2024-09-12", + "cost": { + "input": 1.1, + "output": 4.4, + "cache_read": 0.55 + } }, { - "id": "qwen2.5:32b", - "name": "Qwen2.5 32B", - "display_name": "Qwen2.5 32B", + "id": "gpt-5-mini", + "name": "GPT-5 Mini", + "display_name": "GPT-5 Mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 272000, + "output": 128000 }, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", + "cost": { + "input": 0.25, + "output": 2, + "cache_read": 0.03 + } }, { - "id": "qwen2.5:72b", - "name": "Qwen2.5 72B", - "display_name": "Qwen2.5 72B", + "id": "phi-3.5-moe-instruct", + "name": "Phi-3.5-MoE-instruct", + "display_name": "Phi-3.5-MoE-instruct", "modalities": { "input": [ "text" @@ -64377,40 +63679,64 @@ }, "limit": { "context": 128000, - "output": 32768 + "output": 4096 }, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { "supported": false }, - "type": "chat" + "attachment": false, + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-08-20", + "last_updated": "2024-08-20", + "cost": { + "input": 0.16, + "output": 0.64 + } }, { - "id": "llama3:latest", - "name": "Llama 3 Latest", - "display_name": "Llama 3 Latest", + "id": "gpt-5.1-chat", + "name": "GPT-5.1 Chat", + "display_name": "GPT-5.1 Chat", "modalities": { "input": [ - "text" + "text", + "image", + "audio" ], "output": [ - "text" + "text", + "image", + "audio" ] }, "limit": { - "context": 8000, - "output": 2000 + "context": 128000, + "output": 16384 }, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-14", + "last_updated": "2025-11-14", + "cost": { + "input": 1.25, + "output": 10, + "cache_read": 0.125 + } }, { - "id": "llama3:8b", - "name": "Llama 3 8B", - "display_name": "Llama 3 8B", + "id": "grok-3-mini", + "name": "Grok 3 Mini", + "display_name": "Grok 3 Mini", "modalities": { "input": [ "text" @@ -64420,41 +63746,65 @@ ] }, "limit": { - "context": 8000, - "output": 2000 + "context": 131072, + "output": 8192 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" + "attachment": false, + "open_weights": false, + "knowledge": "2024-11", + "release_date": "2025-02-17", + "last_updated": "2025-02-17", + "cost": { + "input": 0.3, + "output": 0.5, + "reasoning": 0.5, + "cache_read": 0.075 + } }, { - "id": "llama3:70b", - "name": "Llama 3 70B", - "display_name": "Llama 3 70B", + "id": "o1", + "name": "o1", + "display_name": "o1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8000, - "output": 2000 + "context": 200000, + "output": 100000 }, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" + "attachment": false, + "open_weights": false, + "knowledge": "2023-09", + "release_date": "2024-12-05", + "last_updated": "2024-12-05", + "cost": { + "input": 15, + "output": 60, + "cache_read": 7.5 + } }, { - "id": "gemma2:latest", - "name": "Gemma 2 Latest", - "display_name": "Gemma 2 Latest", + "id": "meta-llama-3-8b-instruct", + "name": "Meta-Llama-3-8B-Instruct", + "display_name": "Meta-Llama-3-8B-Instruct", "modalities": { "input": [ "text" @@ -64467,82 +63817,126 @@ "context": 8192, "output": 2048 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, - "type": "chat" + "attachment": false, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-04-18", + "last_updated": "2024-04-18", + "cost": { + "input": 0.3, + "output": 0.61 + } }, { - "id": "gemma2:2b", - "name": "Gemma 2 2B", - "display_name": "Gemma 2 2B", + "id": "phi-4-multimodal", + "name": "Phi-4-multimodal", + "display_name": "Phi-4-multimodal", "modalities": { "input": [ - "text" + "text", + "image", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 2048 + "context": 128000, + "output": 4096 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, - "type": "chat" + "attachment": true, + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", + "cost": { + "input": 0.08, + "output": 0.32, + "input_audio": 4 + } }, { - "id": "gemma2:9b", - "name": "Gemma 2 9B", - "display_name": "Gemma 2 9B", + "id": "o4-mini", + "name": "o4-mini", + "display_name": "o4-mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 2048 + "context": 200000, + "output": 100000 }, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2024-05", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", + "cost": { + "input": 1.1, + "output": 4.4, + "cache_read": 0.28 + } }, { - "id": "gemma2:27b", - "name": "Gemma 2 27B", - "display_name": "Gemma 2 27B", + "id": "gpt-4.1", + "name": "GPT-4.1", + "display_name": "GPT-4.1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 2048 + "context": 1047576, + "output": 32768 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2024-05", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", + "cost": { + "input": 2, + "output": 8, + "cache_read": 0.5 + } }, { - "id": "qwen2.5-coder:latest", - "name": "Qwen2.5-Coder Latest", - "display_name": "Qwen2.5-Coder Latest", + "id": "ministral-3b", + "name": "Ministral 3B", + "display_name": "Ministral 3B", "modalities": { "input": [ "text" @@ -64553,18 +63947,27 @@ }, "limit": { "context": 128000, - "output": 32768 + "output": 8192 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "type": "chat" + "attachment": false, + "open_weights": true, + "knowledge": "2024-03", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", + "cost": { + "input": 0.04, + "output": 0.04 + } }, { - "id": "qwen2.5-coder:0.5b", - "name": "Qwen2.5-Coder 0.5B", - "display_name": "Qwen2.5-Coder 0.5B", + "id": "gpt-3.5-turbo-0301", + "name": "GPT-3.5 Turbo 0301", + "display_name": "GPT-3.5 Turbo 0301", "modalities": { "input": [ "text" @@ -64574,22 +63977,32 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 4096, + "output": 4096 }, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { "supported": false }, - "type": "chat" + "attachment": false, + "open_weights": false, + "knowledge": "2021-08", + "release_date": "2023-03-01", + "last_updated": "2023-03-01", + "cost": { + "input": 1.5, + "output": 2 + } }, { - "id": "qwen2.5-coder:1.5b", - "name": "Qwen2.5-Coder 1.5B", - "display_name": "Qwen2.5-Coder 1.5B", + "id": "gpt-4o", + "name": "GPT-4o", + "display_name": "GPT-4o", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -64597,18 +64010,28 @@ }, "limit": { "context": 128000, - "output": 32768 + "output": 16384 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2023-09", + "release_date": "2024-05-13", + "last_updated": "2024-05-13", + "cost": { + "input": 2.5, + "output": 10, + "cache_read": 1.25 + } }, { - "id": "qwen2.5-coder:3b", - "name": "Qwen2.5-Coder 3B", - "display_name": "Qwen2.5-Coder 3B", + "id": "phi-3-mini-128k-instruct", + "name": "Phi-3-mini-instruct (128k)", + "display_name": "Phi-3-mini-instruct (128k)", "modalities": { "input": [ "text" @@ -64619,21 +64042,31 @@ }, "limit": { "context": 128000, - "output": 32768 + "output": 4096 }, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { "supported": false }, - "type": "chat" + "attachment": false, + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", + "cost": { + "input": 0.13, + "output": 0.52 + } }, { - "id": "qwen2.5-coder:7b", - "name": "Qwen2.5-Coder 7B", - "display_name": "Qwen2.5-Coder 7B", + "id": "llama-3.2-90b-vision-instruct", + "name": "Llama-3.2-90B-Vision-Instruct", + "display_name": "Llama-3.2-90B-Vision-Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -64641,84 +64074,132 @@ }, "limit": { "context": 128000, - "output": 32768 + "output": 8192 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "type": "chat" + "attachment": true, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-09-25", + "last_updated": "2024-09-25", + "cost": { + "input": 2.04, + "output": 2.04 + } }, { - "id": "qwen2.5-coder:14b", - "name": "Qwen2.5-Coder 14B", - "display_name": "Qwen2.5-Coder 14B", + "id": "gpt-5-codex", + "name": "GPT-5-Codex", + "display_name": "GPT-5-Codex", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 400000, + "output": 128000 }, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" + "attachment": false, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-09-15", + "last_updated": "2025-09-15", + "cost": { + "input": 1.25, + "output": 10, + "cache_read": 0.13 + } }, { - "id": "qwen2.5-coder:32b", - "name": "Qwen2.5-Coder 32B", - "display_name": "Qwen2.5-Coder 32B", + "id": "gpt-5-nano", + "name": "GPT-5 Nano", + "display_name": "GPT-5 Nano", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 272000, + "output": 128000 }, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", + "cost": { + "input": 0.05, + "output": 0.4, + "cache_read": 0.01 + } }, { - "id": "phi4:latest", - "name": "Phi-4 Latest", - "display_name": "Phi-4 Latest", + "id": "gpt-5.1", + "name": "GPT-5.1", + "display_name": "GPT-5.1", "modalities": { "input": [ - "text" + "text", + "image", + "audio" ], "output": [ - "text" + "text", + "image", + "audio" ] }, "limit": { - "context": 16000, - "output": 4000 + "context": 272000, + "output": 128000 }, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-14", + "last_updated": "2025-11-14", + "cost": { + "input": 1.25, + "output": 10, + "cache_read": 0.125 + } }, { - "id": "phi4:14b", - "name": "Phi-4 14B", - "display_name": "Phi-4 14B", + "id": "o3-mini", + "name": "o3-mini", + "display_name": "o3-mini", "modalities": { "input": [ "text" @@ -64728,41 +64209,60 @@ ] }, "limit": { - "context": 16000, - "output": 4000 + "context": 200000, + "output": 100000 }, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" + "attachment": false, + "open_weights": false, + "knowledge": "2024-05", + "release_date": "2024-12-20", + "last_updated": "2025-01-29", + "cost": { + "input": 1.1, + "output": 4.4, + "cache_read": 0.55 + } }, { - "id": "gemma:latest", - "name": "Gemma Latest", - "display_name": "Gemma Latest", + "id": "model-router", + "name": "Model Router", + "display_name": "Model Router", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 2048 + "context": 128000, + "output": 16384 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "type": "chat" + "attachment": true, + "open_weights": false, + "release_date": "2025-05-19", + "last_updated": "2025-11-18", + "cost": { + "input": 0.14, + "output": 0 + } }, { - "id": "gemma:2b", - "name": "Gemma 2B", - "display_name": "Gemma 2B", + "id": "kimi-k2-thinking", + "name": "Kimi K2 Thinking", + "display_name": "Kimi K2 Thinking", "modalities": { "input": [ "text" @@ -64772,41 +64272,64 @@ ] }, "limit": { - "context": 8192, - "output": 2048 + "context": 262144, + "output": 262144 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" - }, - { - "id": "gemma:7b", - "name": "Gemma 7B", - "display_name": "Gemma 7B", + "attachment": false, + "open_weights": true, + "knowledge": "2024-08", + "release_date": "2025-11-06", + "last_updated": "2025-12-02", + "cost": { + "input": 0.6, + "output": 2.5, + "cache_read": 0.15 + } + }, + { + "id": "gpt-5.1-codex-mini", + "name": "GPT-5.1 Codex Mini", + "display_name": "GPT-5.1 Codex Mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 2048 + "context": 400000, + "output": 128000 }, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" + "attachment": false, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-14", + "last_updated": "2025-11-14", + "cost": { + "input": 0.25, + "output": 2, + "cache_read": 0.025 + } }, { - "id": "llama2:latest", - "name": "Llama 2 Latest", - "display_name": "Llama 2 Latest", + "id": "llama-3.3-70b-instruct", + "name": "Llama-3.3-70B-Instruct", + "display_name": "Llama-3.3-70B-Instruct", "modalities": { "input": [ "text" @@ -64816,19 +64339,28 @@ ] }, "limit": { - "context": 4096, - "output": 1024 + "context": 128000, + "output": 32768 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "type": "chat" + "attachment": false, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", + "cost": { + "input": 0.71, + "output": 0.71 + } }, { - "id": "llama2:7b", - "name": "Llama 2 7B", - "display_name": "Llama 2 7B", + "id": "o1-preview", + "name": "o1-preview", + "display_name": "o1-preview", "modalities": { "input": [ "text" @@ -64838,19 +64370,30 @@ ] }, "limit": { - "context": 4096, - "output": 1024 + "context": 128000, + "output": 32768 }, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" + "attachment": false, + "open_weights": false, + "knowledge": "2023-09", + "release_date": "2024-09-12", + "last_updated": "2024-09-12", + "cost": { + "input": 16.5, + "output": 66, + "cache_read": 8.25 + } }, { - "id": "llama2:13b", - "name": "Llama 2 13B", - "display_name": "Llama 2 13B", + "id": "phi-3.5-mini-instruct", + "name": "Phi-3.5-mini-instruct", + "display_name": "Phi-3.5-mini-instruct", "modalities": { "input": [ "text" @@ -64860,19 +64403,28 @@ ] }, "limit": { - "context": 4096, - "output": 1024 + "context": 128000, + "output": 4096 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, - "type": "chat" + "attachment": false, + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-08-20", + "last_updated": "2024-08-20", + "cost": { + "input": 0.13, + "output": 0.52 + } }, { - "id": "llama2:70b", - "name": "Llama 2 70B", - "display_name": "Llama 2 70B", + "id": "gpt-3.5-turbo-0613", + "name": "GPT-3.5 Turbo 0613", + "display_name": "GPT-3.5 Turbo 0613", "modalities": { "input": [ "text" @@ -64882,22 +64434,32 @@ ] }, "limit": { - "context": 4096, - "output": 1024 + "context": 16384, + "output": 16384 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, - "type": "chat" + "attachment": false, + "open_weights": false, + "knowledge": "2021-08", + "release_date": "2023-06-13", + "last_updated": "2023-06-13", + "cost": { + "input": 3, + "output": 4 + } }, { - "id": "qwen2:latest", - "name": "Qwen2 Latest", - "display_name": "Qwen2 Latest", + "id": "gpt-4-turbo", + "name": "GPT-4 Turbo", + "display_name": "GPT-4 Turbo", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -64905,18 +64467,27 @@ }, "limit": { "context": 128000, - "output": 32768 + "output": 4096 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2023-11", + "release_date": "2023-11-06", + "last_updated": "2024-04-09", + "cost": { + "input": 10, + "output": 30 + } }, { - "id": "qwen2:0.5b", - "name": "Qwen2 0.5B", - "display_name": "Qwen2 0.5B", + "id": "meta-llama-3.1-70b-instruct", + "name": "Meta-Llama-3.1-70B-Instruct", + "display_name": "Meta-Llama-3.1-70B-Instruct", "modalities": { "input": [ "text" @@ -64929,16 +64500,25 @@ "context": 128000, "output": 32768 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "type": "chat" + "attachment": false, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", + "cost": { + "input": 2.68, + "output": 3.54 + } }, { - "id": "qwen2:1.5b", - "name": "Qwen2 1.5B", - "display_name": "Qwen2 1.5B", + "id": "phi-3-small-8k-instruct", + "name": "Phi-3-small-instruct (8k)", + "display_name": "Phi-3-small-instruct (8k)", "modalities": { "input": [ "text" @@ -64948,19 +64528,28 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 8192, + "output": 2048 }, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { "supported": false }, - "type": "chat" + "attachment": false, + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", + "cost": { + "input": 0.15, + "output": 0.6 + } }, { - "id": "qwen2:7b", - "name": "Qwen2 7B", - "display_name": "Qwen2 7B", + "id": "deepseek-v3-0324", + "name": "DeepSeek-V3-0324", + "display_name": "DeepSeek-V3-0324", "modalities": { "input": [ "text" @@ -64970,19 +64559,28 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 131072, + "output": 131072 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "type": "chat" + "attachment": false, + "open_weights": true, + "knowledge": "2024-07", + "release_date": "2025-03-24", + "last_updated": "2025-03-24", + "cost": { + "input": 1.14, + "output": 4.56 + } }, { - "id": "qwen2:72b", - "name": "Qwen2 72B", - "display_name": "Qwen2 72B", + "id": "meta-llama-3-70b-instruct", + "name": "Meta-Llama-3-70B-Instruct", + "display_name": "Meta-Llama-3-70B-Instruct", "modalities": { "input": [ "text" @@ -64992,19 +64590,28 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 8192, + "output": 2048 }, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { "supported": false }, - "type": "chat" + "attachment": false, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-04-18", + "last_updated": "2024-04-18", + "cost": { + "input": 2.68, + "output": 3.54 + } }, { - "id": "deepseek-v3:latest", - "name": "DeepSeek-V3 Latest", - "display_name": "DeepSeek-V3 Latest", + "id": "text-embedding-3-large", + "name": "text-embedding-3-large", + "display_name": "text-embedding-3-large", "modalities": { "input": [ "text" @@ -65014,20 +64621,26 @@ ] }, "limit": { - "context": 160000, - "output": 40000 + "context": 8191, + "output": 3072 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "type": "chat" + "attachment": false, + "open_weights": false, + "release_date": "2024-01-25", + "last_updated": "2024-01-25", + "cost": { + "input": 0.13, + "output": 0 + } }, { - "id": "deepseek-v3:671b", - "name": "DeepSeek-V3 671B", - "display_name": "DeepSeek-V3 671B", + "id": "grok-3", + "name": "Grok 3", + "display_name": "Grok 3", "modalities": { "input": [ "text" @@ -65037,20 +64650,29 @@ ] }, "limit": { - "context": 160000, - "output": 40000 + "context": 131072, + "output": 8192 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "type": "chat" + "attachment": false, + "open_weights": false, + "knowledge": "2024-11", + "release_date": "2025-02-17", + "last_updated": "2025-02-17", + "cost": { + "input": 3, + "output": 15, + "cache_read": 0.75 + } }, { - "id": "llama3.3:latest", - "name": "Llama 3.3 Latest", - "display_name": "Llama 3.3 Latest", + "id": "gpt-3.5-turbo-0125", + "name": "GPT-3.5 Turbo 0125", + "display_name": "GPT-3.5 Turbo 0125", "modalities": { "input": [ "text" @@ -65060,41 +64682,64 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 16384, + "output": 16384 }, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { "supported": false }, - "type": "chat" + "attachment": false, + "open_weights": false, + "knowledge": "2021-08", + "release_date": "2024-01-25", + "last_updated": "2024-01-25", + "cost": { + "input": 0.5, + "output": 1.5 + } }, { - "id": "llama3.3:70b", - "name": "Llama 3.3 70B", - "display_name": "Llama 3.3 70B", + "id": "claude-sonnet-4-5", + "name": "Claude Sonnet 4.5", + "display_name": "Claude Sonnet 4.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 200000, + "output": 64000 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2025-07-31", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", + "cost": { + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 + } }, { - "id": "bge-m3:latest", - "name": "BGE-M3 Latest", - "display_name": "BGE-M3 Latest", + "id": "phi-4-mini-reasoning", + "name": "Phi-4-mini-reasoning", + "display_name": "Phi-4-mini-reasoning", "modalities": { "input": [ "text" @@ -65104,19 +64749,29 @@ ] }, "limit": { - "context": 8192, - "output": 0 + "context": 128000, + "output": 4096 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "embedding" + "attachment": false, + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", + "cost": { + "input": 0.075, + "output": 0.3 + } }, { - "id": "bge-m3:567m", - "name": "BGE-M3 567M", - "display_name": "BGE-M3 567M", + "id": "phi-4", + "name": "Phi-4", + "display_name": "Phi-4", "modalities": { "input": [ "text" @@ -65126,42 +64781,60 @@ ] }, "limit": { - "context": 8192, - "output": 0 + "context": 128000, + "output": 4096 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, - "type": "embedding" + "attachment": false, + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", + "cost": { + "input": 0.125, + "output": 0.5 + } }, { - "id": "llama3.2-vision:latest", - "name": "Llama 3.2 Vision Latest", - "display_name": "Llama 3.2 Vision Latest", + "id": "deepseek-v3.1", + "name": "DeepSeek-V3.1", + "display_name": "DeepSeek-V3.1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 131072, + "output": 131072 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" + "attachment": false, + "open_weights": true, + "knowledge": "2024-07", + "release_date": "2025-08-21", + "last_updated": "2025-08-21", + "cost": { + "input": 0.56, + "output": 1.68 + } }, { - "id": "llama3.2-vision:11b", - "name": "Llama 3.2 Vision 11B", - "display_name": "Llama 3.2 Vision 11B", + "id": "gpt-5-chat", + "name": "GPT-5 Chat", + "display_name": "GPT-5 Chat", "modalities": { "input": [ "text", @@ -65173,18 +64846,29 @@ }, "limit": { "context": 128000, - "output": 32768 + "output": 16384 }, + "temperature": false, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2024-10-24", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", + "cost": { + "input": 1.25, + "output": 10, + "cache_read": 0.13 + } }, { - "id": "llama3.2-vision:90b", - "name": "Llama 3.2 Vision 90B", - "display_name": "Llama 3.2 Vision 90B", + "id": "gpt-4.1-mini", + "name": "GPT-4.1 mini", + "display_name": "GPT-4.1 mini", "modalities": { "input": [ "text", @@ -65195,41 +64879,61 @@ ] }, "limit": { - "context": 128000, + "context": 1047576, "output": 32768 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2024-05", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", + "cost": { + "input": 0.4, + "output": 1.6, + "cache_read": 0.1 + } }, { - "id": "tinyllama:latest", - "name": "TinyLlama Latest", - "display_name": "TinyLlama Latest", + "id": "llama-4-maverick-17b-128e-instruct-fp8", + "name": "Llama 4 Maverick 17B 128E Instruct FP8", + "display_name": "Llama 4 Maverick 17B 128E Instruct FP8", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 2048, - "output": 512 + "context": 128000, + "output": 8192 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "type": "chat" + "attachment": true, + "open_weights": true, + "knowledge": "2024-08", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", + "cost": { + "input": 0.25, + "output": 1 + } }, { - "id": "tinyllama:1.1b", - "name": "TinyLlama 1.1B", - "display_name": "TinyLlama 1.1B", + "id": "cohere-command-r-plus-08-2024", + "name": "Command R+", + "display_name": "Command R+", "modalities": { "input": [ "text" @@ -65239,21 +64943,31 @@ ] }, "limit": { - "context": 2048, - "output": 512 + "context": 128000, + "output": 4000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" - }, - { - "id": "starcoder2:latest", - "name": "StarCoder2 Latest", - "display_name": "StarCoder2 Latest", - "modalities": { - "input": [ + "attachment": false, + "open_weights": true, + "knowledge": "2024-06-01", + "release_date": "2024-08-30", + "last_updated": "2024-08-30", + "cost": { + "input": 2.5, + "output": 10 + } + }, + { + "id": "cohere-command-a", + "name": "Command A", + "display_name": "Command A", + "modalities": { + "input": [ "text" ], "output": [ @@ -65261,19 +64975,29 @@ ] }, "limit": { - "context": 16384, - "output": 4096 + "context": 256000, + "output": 8000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" + "attachment": false, + "open_weights": true, + "knowledge": "2024-06-01", + "release_date": "2025-03-13", + "last_updated": "2025-03-13", + "cost": { + "input": 2.5, + "output": 10 + } }, { - "id": "starcoder2:3b", - "name": "StarCoder2 3B", - "display_name": "StarCoder2 3B", + "id": "phi-3-small-128k-instruct", + "name": "Phi-3-small-instruct (128k)", + "display_name": "Phi-3-small-instruct (128k)", "modalities": { "input": [ "text" @@ -65283,63 +65007,96 @@ ] }, "limit": { - "context": 16384, + "context": 128000, "output": 4096 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, - "type": "chat" + "attachment": false, + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", + "cost": { + "input": 0.15, + "output": 0.6 + } }, { - "id": "starcoder2:7b", - "name": "StarCoder2 7B", - "display_name": "StarCoder2 7B", + "id": "claude-opus-4-5", + "name": "Claude Opus 4.5", + "display_name": "Claude Opus 4.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 16384, - "output": 4096 + "context": 200000, + "output": 64000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-11-24", + "last_updated": "2025-08-01", + "cost": { + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 + } }, { - "id": "starcoder2:15b", - "name": "StarCoder2 15B", - "display_name": "StarCoder2 15B", + "id": "mistral-medium-2505", + "name": "Mistral Medium 3", + "display_name": "Mistral Medium 3", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 16384, - "output": 4096 + "context": 128000, + "output": 128000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2025-05", + "release_date": "2025-05-07", + "last_updated": "2025-05-07", + "cost": { + "input": 0.4, + "output": 2 + } }, { - "id": "codegemma:latest", - "name": "CodeGemma Latest", - "display_name": "CodeGemma Latest", + "id": "deepseek-v3.2-speciale", + "name": "DeepSeek-V3.2-Speciale", + "display_name": "DeepSeek-V3.2-Speciale", "modalities": { "input": [ "text" @@ -65349,41 +65106,65 @@ ] }, "limit": { - "context": 8192, - "output": 2048 + "context": 128000, + "output": 128000 }, + "temperature": true, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" + "attachment": false, + "open_weights": true, + "knowledge": "2024-07", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", + "cost": { + "input": 0.58, + "output": 1.68 + } }, { - "id": "codegemma:2b", - "name": "CodeGemma 2B", - "display_name": "CodeGemma 2B", + "id": "claude-haiku-4-5", + "name": "Claude Haiku 4.5", + "display_name": "Claude Haiku 4.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 2048 + "context": 200000, + "output": 64000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2025-02-31", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", + "cost": { + "input": 1, + "output": 5, + "cache_read": 0.1, + "cache_write": 1.25 + } }, { - "id": "codegemma:7b", - "name": "CodeGemma 7B", - "display_name": "CodeGemma 7B", + "id": "phi-3-mini-4k-instruct", + "name": "Phi-3-mini-instruct (4k)", + "display_name": "Phi-3-mini-instruct (4k)", "modalities": { "input": [ "text" @@ -65393,19 +65174,65 @@ ] }, "limit": { - "context": 8192, - "output": 2048 + "context": 4096, + "output": 1024 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, - "type": "chat" + "attachment": false, + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", + "cost": { + "input": 0.13, + "output": 0.52 + } }, { - "id": "kimi-k2-thinking:cloud", - "name": "Kimi K2 Thinking", - "display_name": "Kimi K2 Thinking", + "id": "gpt-5.1-codex", + "name": "GPT-5.1 Codex", + "display_name": "GPT-5.1 Codex", + "modalities": { + "input": [ + "text", + "image", + "audio" + ], + "output": [ + "text", + "image", + "audio" + ] + }, + "limit": { + "context": 400000, + "output": 128000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-14", + "last_updated": "2025-11-14", + "cost": { + "input": 1.25, + "output": 10, + "cache_read": 0.125 + } + }, + { + "id": "grok-code-fast-1", + "name": "Grok Code Fast 1", + "display_name": "Grok Code Fast 1", "modalities": { "input": [ "text" @@ -65416,7 +65243,7 @@ }, "limit": { "context": 256000, - "output": 8192 + "output": 10000 }, "temperature": true, "tool_call": true, @@ -65425,43 +65252,52 @@ "default": true }, "attachment": false, - "open_weights": true, - "release_date": "2025-11-06", - "last_updated": "2025-11-06", - "type": "chat" + "open_weights": false, + "knowledge": "2023-10", + "release_date": "2025-08-28", + "last_updated": "2025-08-28", + "cost": { + "input": 0.2, + "output": 1.5, + "cache_read": 0.02 + } }, { - "id": "qwen3-vl-235b-cloud", - "name": "Qwen3-VL 235B Instruct", - "display_name": "Qwen3-VL 235B Instruct", + "id": "deepseek-r1", + "name": "DeepSeek-R1", + "display_name": "DeepSeek-R1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 8192 + "context": 163840, + "output": 163840 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2025-09-22", - "last_updated": "2025-09-22", - "type": "chat" + "knowledge": "2024-07", + "release_date": "2025-01-20", + "last_updated": "2025-01-20", + "cost": { + "input": 1.35, + "output": 5.4 + } }, { - "id": "cogito-2.1:671b-cloud", - "name": "Cogito 2.1 671B", - "display_name": "Cogito 2.1 671B", + "id": "meta-llama-3.1-405b-instruct", + "name": "Meta-Llama-3.1-405B-Instruct", + "display_name": "Meta-Llama-3.1-405B-Instruct", "modalities": { "input": [ "text" @@ -65471,8 +65307,8 @@ ] }, "limit": { - "context": 160000, - "output": 8192 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -65481,14 +65317,18 @@ }, "attachment": false, "open_weights": true, - "release_date": "2025-11-19", - "last_updated": "2025-11-19", - "type": "chat" + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", + "cost": { + "input": 5.33, + "output": 16 + } }, { - "id": "qwen3-vl-235b-instruct-cloud", - "name": "Qwen3-VL 235B Instruct", - "display_name": "Qwen3-VL 235B Instruct", + "id": "gpt-5.2-codex", + "name": "GPT-5.2 Codex", + "display_name": "GPT-5.2 Codex", "modalities": { "input": [ "text", @@ -65499,24 +65339,30 @@ ] }, "limit": { - "context": 200000, - "output": 8192 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": true, - "release_date": "2025-09-22", - "last_updated": "2025-09-22", - "type": "chat" + "attachment": false, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-01-14", + "last_updated": "2026-01-14", + "cost": { + "input": 1.75, + "output": 14, + "cache_read": 0.175 + } }, { - "id": "kimi-k2:1t-cloud", - "name": "Kimi K2", - "display_name": "Kimi K2", + "id": "gpt-4-32k", + "name": "GPT-4 32K", + "display_name": "GPT-4 32K", "modalities": { "input": [ "text" @@ -65526,8 +65372,8 @@ ] }, "limit": { - "context": 256000, - "output": 8192 + "context": 32768, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -65535,15 +65381,19 @@ "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-09-05", - "last_updated": "2025-09-05", - "type": "chat" + "open_weights": false, + "knowledge": "2023-11", + "release_date": "2023-03-14", + "last_updated": "2023-03-14", + "cost": { + "input": 60, + "output": 120 + } }, { - "id": "minimax-m2:cloud", - "name": "MiniMax M2", - "display_name": "MiniMax M2", + "id": "phi-4-mini", + "name": "Phi-4-mini", + "display_name": "Phi-4-mini", "modalities": { "input": [ "text" @@ -65553,8 +65403,8 @@ ] }, "limit": { - "context": 200000, - "output": 8192 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -65563,50 +65413,48 @@ }, "attachment": false, "open_weights": true, - "release_date": "2025-10-27", - "last_updated": "2025-10-27", - "type": "chat" - } - ] - }, - "burncloud": { - "id": "burncloud", - "name": "burncloud", - "display_name": "burncloud", - "models": [ + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", + "cost": { + "input": 0.075, + "output": 0.3 + } + }, { - "id": "openai/gpt-4-turbo", - "name": "OpenAI GPT-4 Turbo", - "display_name": "GPT-4 Turbo", + "id": "cohere-embed-v3-multilingual", + "name": "Embed v3 Multilingual", + "display_name": "Embed v3 Multilingual", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000 + "context": 512, + "output": 1024 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, + "open_weights": true, + "release_date": "2023-11-07", + "last_updated": "2023-11-07", "cost": { - "input": 8, - "output": 24 - }, - "type": "chat" + "input": 0.1, + "output": 0 + } }, { - "id": "openai/o4-mini", - "name": "OpenAI o4-mini", - "display_name": "o4-mini", + "id": "grok-4", + "name": "Grok 4", + "display_name": "Grok 4", "modalities": { "input": [ "text" @@ -65616,7 +65464,8 @@ ] }, "limit": { - "output": 100000 + "context": 256000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -65624,17 +65473,22 @@ "supported": true, "default": true }, - "attachment": true, + "attachment": false, + "open_weights": false, + "knowledge": "2025-07", + "release_date": "2025-07-09", + "last_updated": "2025-07-09", "cost": { - "input": 0.88, - "output": 3.52 - }, - "type": "chat" + "input": 3, + "output": 15, + "reasoning": 15, + "cache_read": 0.75 + } }, { - "id": "openai/o3", - "name": "OpenAI o3", - "display_name": "o3", + "id": "cohere-command-r-08-2024", + "name": "Command R", + "display_name": "Command R", "modalities": { "input": [ "text" @@ -65644,7 +65498,8 @@ ] }, "limit": { - "output": 100000 + "context": 128000, + "output": 4000 }, "temperature": true, "tool_call": true, @@ -65652,111 +65507,130 @@ "supported": true, "default": true }, - "attachment": true, + "attachment": false, + "open_weights": true, + "knowledge": "2024-06-01", + "release_date": "2024-08-30", + "last_updated": "2024-08-30", "cost": { - "input": 8, - "output": 35 - }, - "type": "chat" + "input": 0.15, + "output": 0.6 + } }, { - "id": "openai/o3-mini", - "name": "OpenAI o3-mini", - "display_name": "o3-mini", + "id": "cohere-embed-v-4-0", + "name": "Embed v4", + "display_name": "Embed v4", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "output": 100000 + "context": 128000, + "output": 1536 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, + "open_weights": true, + "release_date": "2025-04-15", + "last_updated": "2025-04-15", "cost": { - "input": 0.88, - "output": 3.52 - }, - "type": "chat" + "input": 0.12, + "output": 0 + } }, { - "id": "openai/o1", - "name": "OpenAI o1", - "display_name": "o1", + "id": "llama-3.2-11b-vision-instruct", + "name": "Llama-3.2-11B-Vision-Instruct", + "display_name": "Llama-3.2-11B-Vision-Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "output": 100000 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-09-25", + "last_updated": "2024-09-25", "cost": { - "input": 12, - "output": 48 - }, - "type": "chat" + "input": 0.37, + "output": 0.37 + } }, { - "id": "openai/o1-mini", - "name": "OpenAI o1-mini", - "display_name": "o1-mini", + "id": "gpt-5.2-chat", + "name": "GPT-5.2 Chat", + "display_name": "GPT-5.2 Chat", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "output": 65536 + "context": 128000, + "output": 16384 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, "attachment": true, - "cost": { - "input": 0.88, - "output": 3.52 - }, - "type": "chat" + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", + "cost": { + "input": 1.75, + "output": 14, + "cache_read": 0.175 + } }, { - "id": "openai/o1-pro", - "name": "OpenAI o1-pro", - "display_name": "o1-pro", + "id": "claude-opus-4-1", + "name": "Claude Opus 4.1", + "display_name": "Claude Opus 4.1", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "output": 100000 + "context": 200000, + "output": 32000 }, "temperature": true, "tool_call": true, @@ -65765,49 +65639,55 @@ "default": true }, "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", "cost": { - "input": 120, - "output": 480 - }, - "type": "chat" + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 + } }, { - "id": "openai/gpt-4.1", - "name": "OpenAI GPT-4.1", - "display_name": "GPT-4.1", + "id": "gpt-4", + "name": "GPT-4", + "display_name": "GPT-4", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "output": 32768 + "context": 8192, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, + "open_weights": false, + "knowledge": "2023-11", + "release_date": "2023-03-14", + "last_updated": "2023-03-14", "cost": { - "input": 1.6, - "output": 6.4 - }, - "type": "chat" + "input": 60, + "output": 120 + } }, { - "id": "openai/gpt-4o", - "name": "OpenAI GPT-4o", - "display_name": "GPT-4o", + "id": "phi-3-medium-128k-instruct", + "name": "Phi-3-medium-instruct (128k)", + "display_name": "Phi-3-medium-instruct (128k)", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -65815,37 +65695,39 @@ }, "limit": { "context": 128000, - "output": 16384 + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", "cost": { - "input": 2, - "output": 8 - }, - "type": "chat" + "input": 0.17, + "output": 0.68 + } }, { - "id": "openai/gpt-4o-audio", - "name": "OpenAI GPT-4o Audio", - "display_name": "GPT-4o Audio", + "id": "grok-4-fast-reasoning", + "name": "Grok 4 Fast (Reasoning)", + "display_name": "Grok 4 Fast (Reasoning)", "modalities": { "input": [ "text", - "audio" + "image" ], "output": [ - "text", - "audio" + "text" ] }, "limit": { - "output": 16384 + "context": 2000000, + "output": 30000 }, "temperature": true, "tool_call": true, @@ -65854,28 +65736,31 @@ "default": true }, "attachment": true, + "open_weights": false, + "knowledge": "2025-07", + "release_date": "2025-09-19", + "last_updated": "2025-09-19", "cost": { - "input": 2, - "output": 8 - }, - "type": "chat" + "input": 0.2, + "output": 0.5, + "cache_read": 0.05 + } }, { - "id": "openai/gpt-4o-mini", - "name": "OpenAI GPT-4o mini", - "display_name": "GPT-4o mini", + "id": "deepseek-r1-0528", + "name": "DeepSeek-R1-0528", + "display_name": "DeepSeek-R1-0528", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 163840, + "output": 163840 }, "temperature": true, "tool_call": true, @@ -65883,224 +65768,281 @@ "supported": true, "default": true }, - "attachment": true, + "attachment": false, + "open_weights": true, + "knowledge": "2024-07", + "release_date": "2025-05-28", + "last_updated": "2025-05-28", "cost": { - "input": 0.12, - "output": 0.48 - }, - "type": "chat" + "input": 1.35, + "output": 5.4 + } }, { - "id": "openai/gpt-4o-mini-audio", - "name": "OpenAI GPT-4o mini Audio", - "display_name": "GPT-4o mini Audio", + "id": "grok-4-fast-non-reasoning", + "name": "Grok 4 Fast (Non-Reasoning)", + "display_name": "Grok 4 Fast (Non-Reasoning)", "modalities": { "input": [ "text", - "audio" + "image" ], "output": [ - "text", - "audio" + "text" ] }, "limit": { - "output": 16384 + "context": 2000000, + "output": 30000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, + "open_weights": false, + "knowledge": "2025-07", + "release_date": "2025-09-19", + "last_updated": "2025-09-19", "cost": { - "input": 0.12, - "output": 0.48 - }, - "type": "chat" + "input": 0.2, + "output": 0.5, + "cache_read": 0.05 + } }, { - "id": "openai/gpt-4o-realtime", - "name": "OpenAI GPT-4o Realtime", - "display_name": "GPT-4o Realtime", + "id": "text-embedding-3-small", + "name": "text-embedding-3-small", + "display_name": "text-embedding-3-small", "modalities": { "input": [ - "text", - "audio" + "text" ], "output": [ - "text", - "audio" + "text" ] }, "limit": { - "output": 4096 + "context": 8191, + "output": 1536 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, + "open_weights": false, + "release_date": "2024-01-25", + "last_updated": "2024-01-25", "cost": { - "input": 4, - "output": 16 - }, - "type": "chat" + "input": 0.02, + "output": 0 + } }, { - "id": "openai/gpt-4o-mini-realtime", - "name": "OpenAI GPT-4o mini Realtime", - "display_name": "GPT-4o mini Realtime", + "id": "gpt-4.1-nano", + "name": "GPT-4.1 nano", + "display_name": "GPT-4.1 nano", "modalities": { "input": [ "text", - "audio" + "image" ], "output": [ - "text", - "audio" + "text" ] }, "limit": { - "output": 4096 + "context": 1047576, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, + "open_weights": false, + "knowledge": "2024-05", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.48, - "output": 1.92 - }, - "type": "chat" - }, + "input": 0.1, + "output": 0.4, + "cache_read": 0.03 + } + } + ] + }, + "llama": { + "id": "llama", + "name": "Llama", + "display_name": "Llama", + "api": "https://api.llama.com/compat/v1/", + "doc": "https://llama.developer.meta.com/docs/models", + "models": [ { - "id": "openai/gpt-image-1", - "name": "OpenAI GPT Image 1", - "display_name": "GPT Image 1", + "id": "llama-3.3-8b-instruct", + "name": "Llama-3.3-8B-Instruct", + "display_name": "Llama-3.3-8B-Instruct", "modalities": { "input": [ "text" ], "output": [ - "image" + "text" ] }, + "limit": { + "context": 128000, + "output": 4096 + }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 4, - "output": 32 - }, - "type": "imageGeneration" + "input": 0, + "output": 0 + } }, { - "id": "openai/gpt-4o-mini-tts", - "name": "OpenAI GPT-4o mini TTS", - "display_name": "GPT-4o mini TTS", + "id": "llama-4-maverick-17b-128e-instruct-fp8", + "name": "Llama-4-Maverick-17B-128E-Instruct-FP8", + "display_name": "Llama-4-Maverick-17B-128E-Instruct-FP8", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "audio" + "text" ] }, - "temperature": false, - "tool_call": false, + "limit": { + "context": 128000, + "output": 4096 + }, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, + "open_weights": true, + "knowledge": "2024-08", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", "cost": { - "input": 0.48, - "output": 0.96 + "input": 0, + "output": 0 } }, { - "id": "openai/tts-1-hd", - "name": "OpenAI TTS-1 HD", - "display_name": "TTS-1 HD", + "id": "llama-3.3-70b-instruct", + "name": "Llama-3.3-70B-Instruct", + "display_name": "Llama-3.3-70B-Instruct", "modalities": { "input": [ "text" ], "output": [ - "audio" + "text" ] }, - "temperature": false, - "tool_call": false, + "limit": { + "context": 128000, + "output": 4096 + }, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 24 + "input": 0, + "output": 0 } }, { - "id": "openai/gpt-4o-transcribe", - "name": "OpenAI GPT-4o Transcribe", - "display_name": "GPT-4o Transcribe", + "id": "llama-4-scout-17b-16e-instruct-fp8", + "name": "Llama-4-Scout-17B-16E-Instruct-FP8", + "display_name": "Llama-4-Scout-17B-16E-Instruct-FP8", "modalities": { "input": [ - "audio" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "output": 2000 + "context": 128000, + "output": 4096 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, + "open_weights": true, + "knowledge": "2024-08", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", "cost": { - "input": 2, - "output": 8 + "input": 0, + "output": 0 } }, { - "id": "openai/whisper", - "name": "OpenAI Whisper", - "display_name": "Whisper", + "id": "groq-llama-4-maverick-17b-128e-instruct", + "name": "Groq-Llama-4-Maverick-17B-128E-Instruct", + "display_name": "Groq-Llama-4-Maverick-17B-128E-Instruct", "modalities": { "input": [ - "audio" + "text" ], "output": [ "text" ] }, - "temperature": false, - "tool_call": false, + "limit": { + "context": 128000, + "output": 4096 + }, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", "cost": { - "input": 0.0048 + "input": 0, + "output": 0 } }, { - "id": "openai/gpt-4o-search-preview", - "name": "OpenAI GPT-4o Search Preview", - "display_name": "GPT-4o Search Preview", + "id": "cerebras-llama-4-scout-17b-16e-instruct", + "name": "Cerebras-Llama-4-Scout-17B-16E-Instruct", + "display_name": "Cerebras-Llama-4-Scout-17B-16E-Instruct", "modalities": { "input": [ "text" @@ -66110,25 +66052,28 @@ ] }, "limit": { - "output": 16384 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", "cost": { - "input": 2, - "output": 8 - }, - "type": "chat" + "input": 0, + "output": 0 + } }, { - "id": "openai/computer-use-preview", - "name": "OpenAI Computer Use Preview", - "display_name": "computer-use-preview", + "id": "cerebras-llama-4-maverick-17b-128e-instruct", + "name": "Cerebras-Llama-4-Maverick-17B-128E-Instruct", + "display_name": "Cerebras-Llama-4-Maverick-17B-128E-Instruct", "modalities": { "input": [ "text" @@ -66138,83 +66083,97 @@ ] }, "limit": { - "output": 1024 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", "cost": { - "input": 2.4, - "output": 9.6 - }, - "type": "chat" - }, + "input": 0, + "output": 0 + } + } + ] + }, + "scaleway": { + "id": "scaleway", + "name": "Scaleway", + "display_name": "Scaleway", + "api": "https://api.scaleway.ai/v1", + "doc": "https://www.scaleway.com/en/docs/generative-apis/", + "models": [ { - "id": "google/gemini-2.5-pro", - "name": "Google Gemini 2.5 Pro", - "display_name": "Gemini 2.5 Pro", + "id": "qwen3-235b-a22b-instruct-2507", + "name": "Qwen3 235B A22B Instruct 2507", + "display_name": "Qwen3 235B A22B Instruct 2507", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "output": 65536 + "context": 260000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, + "open_weights": true, + "release_date": "2025-07-01", + "last_updated": "2025-07-01", "cost": { - "input": 1, - "output": 8 - }, - "type": "chat" + "input": 0.75, + "output": 2.25 + } }, { - "id": "google/gemini-2.5-flash", - "name": "Google Gemini 2.5 Flash", - "display_name": "Gemini 2.5 Flash", + "id": "devstral-2-123b-instruct-2512", + "name": "Devstral 2 123B Instruct (2512)", + "display_name": "Devstral 2 123B Instruct (2512)", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "output": 65536 + "context": 256000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, + "open_weights": true, + "release_date": "2026-01-07", + "last_updated": "2026-01-07", "cost": { - "input": 0.12, - "output": 0.48 - }, - "type": "chat" + "input": 0.4, + "output": 2 + } }, { - "id": "google/gemini-2.0-flash", - "name": "Google Gemini 2.0 Flash", - "display_name": "Gemini 2.0 Flash", + "id": "pixtral-12b-2409", + "name": "Pixtral 12B 2409", + "display_name": "Pixtral 12B 2409", "modalities": { "input": [ "text", @@ -66225,71 +66184,88 @@ ] }, "limit": { - "output": 8192 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, + "open_weights": true, + "release_date": "2024-09-25", + "last_updated": "2024-09-25", "cost": { - "input": 0.08, - "output": 0.32 - }, - "type": "chat" + "input": 0.2, + "output": 0.2 + } }, { - "id": "google/imagen-3", - "name": "Google Imagen 3", - "display_name": "Imagen 3", + "id": "llama-3.1-8b-instruct", + "name": "Llama 3.1 8B Instruct", + "display_name": "Llama 3.1 8B Instruct", "modalities": { "input": [ "text" ], "output": [ - "image" + "text" ] }, + "limit": { + "context": 128000, + "output": 16384 + }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.024 - }, - "type": "imageGeneration" + "input": 0.2, + "output": 0.2 + } }, { - "id": "google/veo-2", - "name": "Google Veo 2", - "display_name": "Veo 2", + "id": "mistral-nemo-instruct-2407", + "name": "Mistral Nemo Instruct 2407", + "display_name": "Mistral Nemo Instruct 2407", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "video" + "text" ] }, + "limit": { + "context": 128000, + "output": 8192 + }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, + "open_weights": true, + "release_date": "2024-07-25", + "last_updated": "2024-07-25", "cost": { - "input": 0.28 + "input": 0.2, + "output": 0.2 } }, { - "id": "anthropic/claude-sonnet-4", - "name": "Anthropic Claude Sonnet 4", - "display_name": "Claude Sonnet 4", + "id": "mistral-small-3.2-24b-instruct-2506", + "name": "Mistral Small 3.2 24B Instruct (2506)", + "display_name": "Mistral Small 3.2 24B Instruct (2506)", "modalities": { "input": [ "text", @@ -66300,114 +66276,120 @@ ] }, "limit": { - "context": 200000, - "output": 200000 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, + "open_weights": true, + "release_date": "2025-06-20", + "last_updated": "2025-06-20", "cost": { - "input": 2.4, - "output": 12 - }, - "type": "chat" + "input": 0.15, + "output": 0.35 + } }, { - "id": "anthropic/claude-opus-4", - "name": "Anthropic Claude Opus 4", - "display_name": "Claude Opus 4", + "id": "qwen3-coder-30b-a3b-instruct", + "name": "Qwen3-Coder 30B-A3B Instruct", + "display_name": "Qwen3-Coder 30B-A3B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "cost": { - "input": 12, - "output": 60 - }, - "type": "chat" + "input": 0.2, + "output": 0.8 + } }, { - "id": "anthropic/claude-3.7-sonnet", - "name": "Anthropic Claude 3.7 Sonnet", - "display_name": "Claude 3.7 Sonnet", + "id": "llama-3.3-70b-instruct", + "name": "Llama-3.3-70B-Instruct", + "display_name": "Llama-3.3-70B-Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 200000 + "context": 100000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 2.4, - "output": 12 - }, - "type": "chat" + "input": 0.9, + "output": 0.9 + } }, { - "id": "anthropic/claude-3.5-haiku", - "name": "Anthropic Claude 3.5 Haiku", - "display_name": "Claude 3.5 Haiku", + "id": "whisper-large-v3", + "name": "Whisper Large v3", + "display_name": "Whisper Large v3", "modalities": { "input": [ - "text", - "image" + "audio" ], "output": [ "text" ] }, "limit": { - "context": 200000 + "context": 0, + "output": 4096 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, + "open_weights": true, + "knowledge": "2023-09", + "release_date": "2023-09-01", + "last_updated": "2025-09-05", "cost": { - "input": 0.64, - "output": 3.2 - }, - "type": "chat" + "input": 0.003, + "output": 0 + } }, { - "id": "xai/grok-3", - "name": "xAI Grok-3", - "display_name": "Grok-3", + "id": "deepseek-r1-distill-llama-70b", + "name": "DeepSeek R1 Distill Llama 70B", + "display_name": "DeepSeek R1 Distill Llama 70B", "modalities": { "input": [ "text" @@ -66417,7 +66399,8 @@ ] }, "limit": { - "output": 8192 + "context": 32000, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -66425,45 +66408,51 @@ "supported": true, "default": true }, - "attachment": true, + "attachment": false, + "open_weights": true, + "knowledge": "2024-07", + "release_date": "2025-01-20", + "last_updated": "2025-01-20", "cost": { - "input": 2.4, - "output": 12 - }, - "type": "chat" + "input": 0.9, + "output": 0.9 + } }, { - "id": "xai/grok-3-mini", - "name": "xAI Grok-3 Mini", - "display_name": "Grok-3 Mini", + "id": "voxtral-small-24b-2507", + "name": "Voxtral Small 24B 2507", + "display_name": "Voxtral Small 24B 2507", "modalities": { "input": [ - "text" + "text", + "audio" ], "output": [ "text" ] }, "limit": { - "output": 4096 + "context": 32000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, + "open_weights": true, + "release_date": "2025-07-01", + "last_updated": "2025-07-01", "cost": { - "input": 0.24, - "output": 0.4 - }, - "type": "chat" + "input": 0.15, + "output": 0.35 + } }, { - "id": "deepseek/deepseek-r1", - "name": "DeepSeek Reasoner", - "display_name": "DeepSeek R1", + "id": "gpt-oss-120b", + "name": "GPT-OSS 120B", + "display_name": "GPT-OSS 120B", "modalities": { "input": [ "text" @@ -66473,25 +66462,27 @@ ] }, "limit": { + "context": 128000, "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, + "open_weights": true, + "release_date": "2024-01-01", + "last_updated": "2024-01-01", "cost": { - "input": 0.1104, - "output": 1.7632 - }, - "type": "chat" + "input": 0.15, + "output": 0.6 + } }, { - "id": "deepseek/deepseek-chat", - "name": "DeepSeek Chat", - "display_name": "DeepSeek Chat", + "id": "bge-multilingual-gemma2", + "name": "BGE Multilingual Gemma2", + "display_name": "BGE Multilingual Gemma2", "modalities": { "input": [ "text" @@ -66501,32 +66492,27 @@ ] }, "limit": { - "output": 8192 + "context": 8191, + "output": 3072 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, + "open_weights": false, + "release_date": "2024-07-26", + "last_updated": "2025-06-15", "cost": { - "input": 0.0552, - "output": 0.8816 - }, - "type": "chat" - } - ] - }, - "cherryin": { - "id": "cherryin", - "name": "cherryin", - "display_name": "cherryin", - "models": [ + "input": 0.13, + "output": 0 + } + }, { - "id": "anthropic/claude-opus-4.5", - "name": "Claude Opus 4.5", - "display_name": "Claude Opus 4.5", + "id": "gemma-3-27b-it", + "name": "Gemma-3-27B-IT", + "display_name": "Gemma-3-27B-IT", "modalities": { "input": [ "text", @@ -66537,30 +66523,42 @@ ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 40000, + "output": 8192 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "attachment": true, "open_weights": false, + "knowledge": "2024-12", + "release_date": "2024-12-01", + "last_updated": "2025-09-05", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5 - }, - "type": "chat" - }, + "input": 0.25, + "output": 0.5 + } + } + ] + }, + "amazon-bedrock": { + "id": "amazon-bedrock", + "name": "Amazon Bedrock", + "display_name": "Amazon Bedrock", + "doc": "https://docs.aws.amazon.com/bedrock/latest/userguide/models-supported.html", + "models": [ { - "id": "anthropic/claude-3.7-sonnet", - "name": "Anthropic: Claude 3.7 Sonnet", - "display_name": "Anthropic: Claude 3.7 Sonnet", + "id": "us.anthropic.claude-sonnet-4-5-20250929-v1:0", + "name": "Claude Sonnet 4.5 (US)", + "display_name": "Claude Sonnet 4.5 (US)", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -66570,7 +66568,7 @@ "context": 200000, "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -66578,45 +66576,53 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-01", - "release_date": "2025-02-19", - "last_updated": "2025-02-19", - "type": "chat" + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", + "cost": { + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 + } }, { - "id": "anthropic/claude-haiku-4.5", - "name": "Anthropic: claude-haiku-4-5", - "display_name": "Anthropic: claude-haiku-4-5", + "id": "cohere.command-r-plus-v1:0", + "name": "Command R+", + "display_name": "Command R+", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "type": "chat" + "attachment": false, + "open_weights": true, + "knowledge": "2024-04", + "release_date": "2024-04-04", + "last_updated": "2024-04-04", + "cost": { + "input": 3, + "output": 15 + } }, { - "id": "anthropic/claude-opus-4", - "name": "Anthropic: Claude Opus 4", - "display_name": "Anthropic: Claude Opus 4", + "id": "anthropic.claude-v2", + "name": "Claude 2", + "display_name": "Claude 2", "modalities": { "input": [ - "image", "text" ], "output": [ @@ -66624,30 +66630,33 @@ ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 100000, + "output": 4096 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", - "type": "chat" + "knowledge": "2023-08", + "release_date": "2023-07-11", + "last_updated": "2023-07-11", + "cost": { + "input": 8, + "output": 24 + } }, { - "id": "anthropic/claude-opus-4.1", - "name": "Anthropic: Claude Opus 4.1", - "display_name": "Anthropic: Claude Opus 4.1", + "id": "anthropic.claude-3-7-sonnet-20250219-v1:0", + "name": "Claude Sonnet 3.7", + "display_name": "Claude Sonnet 3.7", "modalities": { "input": [ + "text", "image", - "text" + "pdf" ], "output": [ "text" @@ -66655,39 +66664,44 @@ }, "limit": { "context": 200000, - "output": 32000 + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-08-05", - "last_updated": "2025-08-05", - "type": "chat" + "knowledge": "2024-04", + "release_date": "2025-02-19", + "last_updated": "2025-02-19", + "cost": { + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 + } }, { - "id": "anthropic/claude-sonnet-4", - "name": "Anthropic: Claude Sonnet 4", - "display_name": "Anthropic: Claude Sonnet 4", + "id": "anthropic.claude-sonnet-4-20250514-v1:0", + "name": "Claude Sonnet 4", + "display_name": "Claude Sonnet 4", "modalities": { "input": [ + "text", "image", - "text" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1000000, + "context": 200000, "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -66695,83 +66709,82 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-03-31", + "knowledge": "2024-04", "release_date": "2025-05-22", "last_updated": "2025-05-22", - "type": "chat" + "cost": { + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 + } }, { - "id": "anthropic/claude-sonnet-4.5", - "name": "Anthropic: Claude Sonnet 4.5", - "display_name": "Anthropic: Claude Sonnet 4.5", + "id": "qwen.qwen3-coder-30b-a3b-v1:0", + "name": "Qwen3 Coder 30B A3B Instruct", + "display_name": "Qwen3 Coder 30B A3B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 262144, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", - "type": "chat" - }, - { - "id": "bytedance/seed-oss-36b-instruct", - "name": "ByteDance: Seed OSS 36B Instruct", - "display_name": "ByteDance: Seed OSS 36B Instruct", - "limit": { - "context": 4096, - "output": 4096 - }, - "tool_call": false, - "reasoning": { - "supported": false + "knowledge": "2024-04", + "release_date": "2025-09-18", + "last_updated": "2025-09-18", + "cost": { + "input": 0.15, + "output": 0.6 } }, { - "id": "deepseek/deepseek-r1-0528", - "name": "DeepSeek: R1 0528", - "display_name": "DeepSeek: R1 0528", + "id": "google.gemma-3-4b-it", + "name": "Gemma 3 4B IT", + "display_name": "Gemma 3 4B IT", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 163840, - "output": 163840 + "context": 128000, + "output": 4096 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "type": "chat" + "open_weights": false, + "release_date": "2024-12-01", + "last_updated": "2024-12-01", + "cost": { + "input": 0.04, + "output": 0.08 + } }, { - "id": "deepseek/deepseek-v3.1", - "name": "DeepSeek V3.1", - "display_name": "DeepSeek V3.1", + "id": "minimax.minimax-m2", + "name": "MiniMax M2", + "display_name": "MiniMax M2", "modalities": { "input": [ "text" @@ -66781,8 +66794,8 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 204608, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -66791,40 +66804,50 @@ "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2024-07", - "release_date": "2025-08-20", - "last_updated": "2025-08-26", - "type": "chat" - }, - { - "id": "deepseek/deepseek-v3.1-fast", - "name": "DeepSeek: DeepSeek V3.1 (free)", - "display_name": "DeepSeek: DeepSeek V3.1 (free)", + "open_weights": true, + "release_date": "2025-10-27", + "last_updated": "2025-10-27", + "cost": { + "input": 0.3, + "output": 1.2 + } + }, + { + "id": "meta.llama3-2-11b-instruct-v1:0", + "name": "Llama 3.2 11B Instruct", + "display_name": "Llama 3.2 11B Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 163800 + "context": 128000, + "output": 4096 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, - "type": "chat" + "attachment": true, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-09-25", + "last_updated": "2024-09-25", + "cost": { + "input": 0.16, + "output": 0.16 + } }, { - "id": "deepseek/deepseek-v3.1-terminus", - "name": "DeepSeek: DeepSeek V3.1 Terminus", - "display_name": "DeepSeek: DeepSeek V3.1 Terminus", + "id": "qwen.qwen3-next-80b-a3b", + "name": "Qwen/Qwen3-Next-80B-A3B-Instruct", + "display_name": "Qwen/Qwen3-Next-80B-A3B-Instruct", "modalities": { "input": [ "text" @@ -66834,247 +66857,295 @@ ] }, "limit": { - "context": 163840, - "output": 163840 + "context": 262000, + "output": 262000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-07", - "release_date": "2025-09-22", - "last_updated": "2025-09-22", - "type": "chat" + "open_weights": false, + "release_date": "2025-09-18", + "last_updated": "2025-11-25", + "cost": { + "input": 0.14, + "output": 1.4 + } }, { - "id": "deepseek/deepseek-v3.2-exp", - "name": "DeepSeek: DeepSeek V3.2 Exp", - "display_name": "DeepSeek: DeepSeek V3.2 Exp", + "id": "anthropic.claude-3-haiku-20240307-v1:0", + "name": "Claude Haiku 3", + "display_name": "Claude Haiku 3", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 163840 + "context": 200000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2024-02", + "release_date": "2024-03-13", + "last_updated": "2024-03-13", + "cost": { + "input": 0.25, + "output": 1.25 + } }, { - "id": "google/gemini-2.5-flash", - "name": "Google: Gemini 2.5 Flash", - "display_name": "Google: Gemini 2.5 Flash", + "id": "meta.llama3-2-90b-instruct-v1:0", + "name": "Llama 3.2 90B Instruct", + "display_name": "Llama 3.2 90B Instruct", "modalities": { "input": [ - "image", "text", - "audio" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65535 + "context": 128000, + "output": 4096 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-07-17", - "last_updated": "2025-07-17", - "type": "chat" + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-09-25", + "last_updated": "2024-09-25", + "cost": { + "input": 0.72, + "output": 0.72 + } }, { - "id": "google/gemini-2.5-flash-image", - "name": "Google: Gemini 2.5 Flash Image (Nano Banana)", - "display_name": "Google: Gemini 2.5 Flash Image (Nano Banana)", + "id": "qwen.qwen3-vl-235b-a22b", + "name": "Qwen/Qwen3-VL-235B-A22B-Instruct", + "display_name": "Qwen/Qwen3-VL-235B-A22B-Instruct", "modalities": { "input": [ - "image", - "text" + "text", + "image" ], "output": [ - "image", "text" ] }, "limit": { - "context": 32768, - "output": 8192 + "context": 262000, + "output": 262000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "type": "imageGeneration" + "attachment": true, + "open_weights": false, + "release_date": "2025-10-04", + "last_updated": "2025-11-25", + "cost": { + "input": 0.3, + "output": 1.5 + } }, { - "id": "google/gemini-2.5-flash-image-preview", - "name": "Google: Gemini 2.5 Flash Image Preview (Nano Banana)", - "display_name": "Google: Gemini 2.5 Flash Image Preview (Nano Banana)", + "id": "meta.llama3-2-1b-instruct-v1:0", + "name": "Llama 3.2 1B Instruct", + "display_name": "Llama 3.2 1B Instruct", "modalities": { "input": [ - "image", "text" ], "output": [ - "image", "text" ] }, "limit": { - "context": 32768, - "output": 8192 + "context": 131000, + "output": 4096 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "type": "imageGeneration" + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-09-25", + "last_updated": "2024-09-25", + "cost": { + "input": 0.1, + "output": 0.1 + } }, { - "id": "google/gemini-2.5-flash-lite", - "name": "Google: Gemini 2.5 Flash Lite", - "display_name": "Google: Gemini 2.5 Flash Lite", + "id": "us.anthropic.claude-opus-4-6-v1", + "name": "Claude Opus 4.6 (US)", + "display_name": "Claude Opus 4.6 (US)", "modalities": { "input": [ - "image", "text", - "audio" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65535 + "context": 1000000, + "output": 128000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, "attachment": true, - "type": "chat" + "open_weights": false, + "knowledge": "2025-05", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", + "cost": { + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25, + "context_over_200k": { + "input": 10, + "output": 37.5, + "cache_read": 1, + "cache_write": 12.5 + } + } }, { - "id": "google/gemini-2.5-pro", - "name": "Google: Gemini 2.5 Pro", - "display_name": "Google: Gemini 2.5 Pro", + "id": "anthropic.claude-v2:1", + "name": "Claude 2.1", + "display_name": "Claude 2.1", "modalities": { "input": [ - "image", - "text", - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 200000, + "output": 4096 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-03-20", - "last_updated": "2025-06-05", - "type": "chat" + "knowledge": "2023-08", + "release_date": "2023-11-21", + "last_updated": "2023-11-21", + "cost": { + "input": 8, + "output": 24 + } }, { - "id": "google/gemini-3-pro-preview", - "name": "Google: Gemini 3 Pro Preview", - "display_name": "Google: Gemini 3 Pro Preview", + "id": "deepseek.v3-v1:0", + "name": "DeepSeek-V3.1", + "display_name": "DeepSeek-V3.1", "modalities": { "input": [ - "image", - "text", - "audio", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 163840, + "output": 81920 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-10", - "release_date": "2025-11-19", - "last_updated": "2025-11-19", - "type": "chat" + "attachment": false, + "open_weights": true, + "knowledge": "2024-07", + "release_date": "2025-09-18", + "last_updated": "2025-09-18", + "cost": { + "input": 0.58, + "output": 1.68 + } }, { - "id": "inclusionai/ling-1t", - "name": "inclusionAI: Ling-1T", - "display_name": "inclusionAI: Ling-1T", + "id": "anthropic.claude-opus-4-5-20251101-v1:0", + "name": "Claude Opus 4.5", + "display_name": "Claude Opus 4.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-11-24", + "last_updated": "2025-08-01", + "cost": { + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 + } }, { - "id": "meituan/longcat-flash-chat", - "name": "Meituan: LongCat-Flash-Chat", - "display_name": "Meituan: LongCat-Flash-Chat", + "id": "cohere.command-light-text-v14", + "name": "Command Light", + "display_name": "Command Light", "modalities": { "input": [ "text" @@ -67083,19 +67154,29 @@ "text" ] }, + "limit": { + "context": 4096, + "output": 4096 + }, "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "type": "chat" + "open_weights": true, + "knowledge": "2023-08", + "release_date": "2023-11-01", + "last_updated": "2023-11-01", + "cost": { + "input": 0.3, + "output": 0.6 + } }, { - "id": "minimax/minimax-m2", - "name": "MiniMax: minimax-m2", - "display_name": "MiniMax: minimax-m2", + "id": "mistral.mistral-large-2402-v1:0", + "name": "Mistral Large (24.02)", + "display_name": "Mistral Large (24.02)", "modalities": { "input": [ "text" @@ -67105,101 +67186,122 @@ ] }, "limit": { - "context": 204800, - "output": 192000 + "context": 128000, + "output": 4096 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "type": "chat" + "release_date": "2024-12-01", + "last_updated": "2024-12-01", + "cost": { + "input": 0.5, + "output": 1.5 + } }, { - "id": "minimaxai/minimax-m1-80k", - "name": "MiniMax: MiniMax M1", - "display_name": "MiniMax: MiniMax M1", + "id": "google.gemma-3-27b-it", + "name": "Google Gemma 3 27B Instruct", + "display_name": "Google Gemma 3 27B Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 40000 + "context": 202752, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, - "type": "chat" + "attachment": true, + "open_weights": true, + "knowledge": "2025-07", + "release_date": "2025-07-27", + "last_updated": "2025-07-27", + "cost": { + "input": 0.12, + "output": 0.2 + } }, { - "id": "moonshotai/kimi-k2-0905", - "name": "MoonshotAI: Kimi K2 0905", - "display_name": "MoonshotAI: Kimi K2 0905", + "id": "nvidia.nemotron-nano-12b-v2", + "name": "NVIDIA Nemotron Nano 12B v2 VL BF16", + "display_name": "NVIDIA Nemotron Nano 12B v2 VL BF16", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 128000, + "output": 4096 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-09-05", - "last_updated": "2025-09-05", - "type": "chat" + "open_weights": false, + "release_date": "2024-12-01", + "last_updated": "2024-12-01", + "cost": { + "input": 0.2, + "output": 0.6 + } }, { - "id": "moonshotai/kimi-k2-thinking", - "name": "MoonshotAI: kimi-k2-thinking", - "display_name": "MoonshotAI: kimi-k2-thinking", + "id": "google.gemma-3-12b-it", + "name": "Google Gemma 3 12B", + "display_name": "Google Gemma 3 12B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 131072, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "type": "chat" + "knowledge": "2024-12", + "release_date": "2024-12-01", + "last_updated": "2024-12-01", + "cost": { + "input": 0.049999999999999996, + "output": 0.09999999999999999 + } }, { - "id": "moonshotai/kimi-k2-thinking-turbo", - "name": "MoonshotAI: kimi-k2-thinking", - "display_name": "MoonshotAI: kimi-k2-thinking", + "id": "ai21.jamba-1-5-large-v1:0", + "name": "Jamba 1.5 Large", + "display_name": "Jamba 1.5 Large", "modalities": { "input": [ "text" @@ -67209,136 +67311,175 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 256000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": false, - "type": "chat" + "open_weights": true, + "knowledge": "2024-08", + "release_date": "2024-08-15", + "last_updated": "2024-08-15", + "cost": { + "input": 2, + "output": 8 + } }, { - "id": "openai/gpt-4.1", - "name": "OpenAI: GPT-4.1", - "display_name": "OpenAI: GPT-4.1", + "id": "eu.anthropic.claude-haiku-4-5-20251001-v1:0", + "name": "Claude Haiku 4.5 (EU)", + "display_name": "Claude Haiku 4.5 (EU)", "modalities": { "input": [ + "text", "image", - "text" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 200000, + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", - "type": "chat" + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", + "cost": { + "input": 1, + "output": 5, + "cache_read": 0.1, + "cache_write": 1.25 + } }, { - "id": "openai/gpt-4.1-mini", - "name": "OpenAI: GPT-4.1 Mini", - "display_name": "OpenAI: GPT-4.1 Mini", + "id": "us.anthropic.claude-sonnet-4-20250514-v1:0", + "name": "Claude Sonnet 4 (US)", + "display_name": "Claude Sonnet 4 (US)", "modalities": { "input": [ + "text", "image", - "text" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 200000, + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", - "type": "chat" + "release_date": "2025-05-22", + "last_updated": "2025-05-22", + "cost": { + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 + } }, { - "id": "openai/gpt-4.1-nano", - "name": "OpenAI: GPT-4.1 Nano", - "display_name": "OpenAI: GPT-4.1 Nano", + "id": "global.anthropic.claude-sonnet-4-20250514-v1:0", + "name": "Claude Sonnet 4 (Global)", + "display_name": "Claude Sonnet 4 (Global)", "modalities": { "input": [ + "text", "image", - "text" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 200000, + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, - "type": "chat" - }, - { - "id": "openai/gpt-4o", - "name": "OpenAI: gpt-4o", - "display_name": "OpenAI: gpt-4o", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", + "cost": { + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 + } + }, + { + "id": "global.anthropic.claude-haiku-4-5-20251001-v1:0", + "name": "Claude Haiku 4.5 (Global)", + "display_name": "Claude Haiku 4.5 (Global)", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "type": "chat" + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", + "cost": { + "input": 1, + "output": 5, + "cache_read": 0.1, + "cache_write": 1.25 + } }, { - "id": "openai/gpt-4o-mini", - "name": "OpenAI: gpt-4o-mini", - "display_name": "OpenAI: gpt-4o-mini", + "id": "meta.llama3-3-70b-instruct-v1:0", + "name": "Llama 3.3 70B Instruct", + "display_name": "Llama 3.3 70B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -67346,35 +67487,42 @@ }, "limit": { "context": 128000, - "output": 16384 + "output": 4096 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "type": "chat" + "attachment": false, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", + "cost": { + "input": 0.72, + "output": 0.72 + } }, { - "id": "openai/gpt-5", - "name": "OpenAI: GPT-5", - "display_name": "OpenAI: GPT-5", + "id": "us.anthropic.claude-opus-4-5-20251101-v1:0", + "name": "Claude Opus 4.5 (US)", + "display_name": "Claude Opus 4.5 (US)", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 200000, + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -67382,58 +67530,35 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-10-01", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", - "type": "chat" - }, - { - "id": "openai/gpt-5-chat", - "name": "OpenAI: GPT-5 Chat", - "display_name": "OpenAI: GPT-5 Chat", - "modalities": { - "input": [ - "image", - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 128000, - "output": 16384 - }, - "temperature": false, - "tool_call": false, - "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", - "type": "chat" + "knowledge": "2025-03-31", + "release_date": "2025-11-24", + "last_updated": "2025-08-01", + "cost": { + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 + } }, { - "id": "openai/gpt-5-mini", - "name": "OpenAI: GPT-5 Mini", - "display_name": "OpenAI: GPT-5 Mini", + "id": "anthropic.claude-opus-4-6-v1", + "name": "Claude Opus 4.6", + "display_name": "Claude Opus 4.6", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 400000, + "context": 1000000, "output": 128000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -67441,111 +67566,137 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-10-01", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", - "type": "chat" + "knowledge": "2025-05", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", + "cost": { + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25, + "context_over_200k": { + "input": 10, + "output": 37.5, + "cache_read": 1, + "cache_write": 12.5 + } + } }, { - "id": "openai/gpt-5-nano", - "name": "OpenAI: GPT-5 Nano", - "display_name": "OpenAI: GPT-5 Nano", + "id": "anthropic.claude-3-opus-20240229-v1:0", + "name": "Claude Opus 3", + "display_name": "Claude Opus 3", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 200000, + "output": 4096 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2024-10-01", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", - "type": "chat" + "knowledge": "2023-08", + "release_date": "2024-02-29", + "last_updated": "2024-02-29", + "cost": { + "input": 15, + "output": 75 + } }, { - "id": "openai/gpt-5.1", - "name": "OpenAI: gpt-5.1", - "display_name": "OpenAI: gpt-5.1", + "id": "amazon.nova-pro-v1:0", + "name": "Nova Pro", + "display_name": "Nova Pro", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 300000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "type": "chat" + "knowledge": "2024-10", + "release_date": "2024-12-03", + "last_updated": "2024-12-03", + "cost": { + "input": 0.8, + "output": 3.2, + "cache_read": 0.2 + } }, { - "id": "openai/gpt-5.2", - "name": "OpenAI: gpt-5.2", - "display_name": "OpenAI: gpt-5.2", + "id": "meta.llama3-1-8b-instruct-v1:0", + "name": "Llama 3.1 8B Instruct", + "display_name": "Llama 3.1 8B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "type": "chat" + "attachment": false, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", + "cost": { + "input": 0.22, + "output": 0.22 + } }, { - "id": "openai/gpt-5.1-chat", - "name": "OpenAI: gpt-5.1", - "display_name": "OpenAI: gpt-5.1", + "id": "us.anthropic.claude-opus-4-1-20250805-v1:0", + "name": "Claude Opus 4.1 (US)", + "display_name": "Claude Opus 4.1 (US)", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 200000, + "output": 32000 }, "temperature": true, "tool_call": true, @@ -67555,34 +67706,50 @@ }, "attachment": true, "open_weights": false, - "type": "chat" + "knowledge": "2025-03-31", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "cost": { + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 + } }, { - "id": "openai/gpt-image-1", - "name": "OpenAI: gpt-image-1", - "display_name": "OpenAI: gpt-image-1", + "id": "openai.gpt-oss-120b-1:0", + "name": "gpt-oss-120b", + "display_name": "gpt-oss-120b", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, + "limit": { + "context": 128000, + "output": 4096 + }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "type": "imageGeneration" + "release_date": "2024-12-01", + "last_updated": "2024-12-01", + "cost": { + "input": 0.15, + "output": 0.6 + } }, { - "id": "openai/gpt-oss-120b", - "name": "OpenAI: gpt-oss-120b", - "display_name": "OpenAI: gpt-oss-120b", + "id": "qwen.qwen3-32b-v1:0", + "name": "Qwen3 32B (dense)", + "display_name": "Qwen3 32B (dense)", "modalities": { "input": [ "text" @@ -67592,10 +67759,10 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 16384, + "output": 16384 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -67603,46 +67770,58 @@ }, "attachment": false, "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", - "type": "chat" + "knowledge": "2024-04", + "release_date": "2025-09-18", + "last_updated": "2025-09-18", + "cost": { + "input": 0.15, + "output": 0.6 + } }, { - "id": "openai/gpt-oss-20b", - "name": "OpenAI: gpt-oss-20b", - "display_name": "OpenAI: gpt-oss-20b", + "id": "anthropic.claude-3-5-sonnet-20240620-v1:0", + "name": "Claude Sonnet 3.5", + "display_name": "Claude Sonnet 3.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 200000, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2024-06-20", + "last_updated": "2024-06-20", + "cost": { + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 + } }, { - "id": "openai/o1", - "name": "OpenAI: o1", - "display_name": "OpenAI: o1", + "id": "anthropic.claude-haiku-4-5-20251001-v1:0", + "name": "Claude Haiku 4.5", + "display_name": "Claude Haiku 4.5", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -67650,20 +67829,30 @@ }, "limit": { "context": 200000, - "output": 100000 + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, - "type": "chat" + "open_weights": false, + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", + "cost": { + "input": 1, + "output": 5, + "cache_read": 0.1, + "cache_write": 1.25 + } }, { - "id": "openai/o1-mini", - "name": "OpenAI: o1-mini", - "display_name": "OpenAI: o1-mini", + "id": "cohere.command-r-v1:0", + "name": "Command R", + "display_name": "Command R", "modalities": { "input": [ "text" @@ -67674,50 +67863,60 @@ }, "limit": { "context": 128000, - "output": 65536 + "output": 4096 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "type": "chat" + "open_weights": true, + "knowledge": "2024-04", + "release_date": "2024-03-11", + "last_updated": "2024-03-11", + "cost": { + "input": 0.5, + "output": 1.5 + } }, { - "id": "openai/o3", - "name": "OpenAI: o3", - "display_name": "OpenAI: o3", + "id": "mistral.voxtral-small-24b-2507", + "name": "Voxtral Small 24B 2507", + "display_name": "Voxtral Small 24B 2507", "modalities": { "input": [ "text", - "image" + "audio" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 32000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, - "open_weights": false, - "type": "chat" + "open_weights": true, + "release_date": "2025-07-01", + "last_updated": "2025-07-01", + "cost": { + "input": 0.15, + "output": 0.35 + } }, { - "id": "openai/o4-mini", - "name": "OpenAI: o4 Mini", - "display_name": "OpenAI: o4 Mini", + "id": "amazon.nova-micro-v1:0", + "name": "Nova Micro", + "display_name": "Nova Micro", "modalities": { "input": [ - "image", "text" ], "output": [ @@ -67725,26 +67924,29 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 128000, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-06", - "release_date": "2025-04-16", - "last_updated": "2025-04-16", - "type": "chat" + "knowledge": "2024-10", + "release_date": "2024-12-03", + "last_updated": "2024-12-03", + "cost": { + "input": 0.035, + "output": 0.14, + "cache_read": 0.00875 + } }, { - "id": "qwen/qwen3-235b-a22b-instruct-2507", - "name": "Qwen: Qwen3 235B A22B Instruct 2507", - "display_name": "Qwen: Qwen3 235B A22B Instruct 2507", + "id": "meta.llama3-1-70b-instruct-v1:0", + "name": "Llama 3.1 70B Instruct", + "display_name": "Llama 3.1 70B Instruct", "modalities": { "input": [ "text" @@ -67754,21 +67956,28 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 128000, + "output": 4096 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "type": "chat" + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", + "cost": { + "input": 0.72, + "output": 0.72 + } }, { - "id": "qwen/qwen3-235b-a22b-thinking-2507", - "name": "Qwen: Qwen3 235B A22B Thinking 2507", - "display_name": "Qwen: Qwen3 235B A22B Thinking 2507", + "id": "meta.llama3-70b-instruct-v1:0", + "name": "Llama 3 70B Instruct", + "display_name": "Llama 3 70B Instruct", "modalities": { "input": [ "text" @@ -67778,54 +67987,70 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 8192, + "output": 2048 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-25", - "last_updated": "2025-07-25", - "type": "chat" + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", + "cost": { + "input": 2.65, + "output": 3.5 + } }, { - "id": "qwen/qwen3-30b-a3b-instruct-2507", - "name": "Qwen: Qwen3 30B A3B Instruct 2507", - "display_name": "Qwen: Qwen3 30B A3B Instruct 2507", + "id": "global.anthropic.claude-opus-4-6-v1", + "name": "Claude Opus 4.6 (Global)", + "display_name": "Claude Opus 4.6 (Global)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 1000000, + "output": 128000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-29", - "last_updated": "2025-07-29", - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2025-05", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", + "cost": { + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25, + "context_over_200k": { + "input": 10, + "output": 37.5, + "cache_read": 1, + "cache_write": 12.5 + } + } }, { - "id": "qwen/qwen3-30b-a3b-thinking-2507", - "name": "Qwen: Qwen3 30B A3B Thinking 2507", - "display_name": "Qwen: Qwen3 30B A3B Thinking 2507", + "id": "deepseek.r1-v1:0", + "name": "DeepSeek-R1", + "display_name": "DeepSeek-R1", "modalities": { "input": [ "text" @@ -67835,47 +68060,64 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 128000, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, "attachment": false, - "type": "chat" + "open_weights": false, + "knowledge": "2024-07", + "release_date": "2025-01-20", + "last_updated": "2025-05-29", + "cost": { + "input": 1.35, + "output": 5.4 + } }, { - "id": "qwen/qwen3-8b", - "name": "Qwen: Qwen3 8B", - "display_name": "Qwen: Qwen3 8B", + "id": "anthropic.claude-3-5-sonnet-20241022-v2:0", + "name": "Claude Sonnet 3.5 v2", + "display_name": "Claude Sonnet 3.5 v2", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 20000 + "context": 200000, + "output": 8192 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", + "cost": { + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 + } }, { - "id": "qwen/qwen3-coder", - "name": "Qwen: Qwen3 Coder 480B A35B", - "display_name": "Qwen: Qwen3 Coder 480B A35B", + "id": "mistral.ministral-3-8b-instruct", + "name": "Ministral 3 8B", + "display_name": "Ministral 3 8B", "modalities": { "input": [ "text" @@ -67885,25 +68127,27 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 128000, + "output": 4096 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-23", - "last_updated": "2025-07-23", - "type": "chat" + "open_weights": false, + "release_date": "2024-12-01", + "last_updated": "2024-12-01", + "cost": { + "input": 0.15, + "output": 0.15 + } }, { - "id": "qwen/qwen3-coder-30b-a3b-instruct", - "name": "Qwen: Qwen3 Coder 30B A3B Instruct", - "display_name": "Qwen: Qwen3 Coder 30B A3B Instruct", + "id": "cohere.command-text-v14", + "name": "Command", + "display_name": "Command", "modalities": { "input": [ "text" @@ -67912,81 +68156,104 @@ "text" ] }, - "limit": { - "context": 262144, - "output": 262144 - }, - "temperature": false, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": false, - "type": "chat" - }, - { - "id": "qwen/qwen3-coder-480b-a35b-instruct", - "name": "Qwen: Qwen3 Coder 480B A35B Instruct", - "display_name": "Qwen: Qwen3 Coder 480B A35B Instruct", "limit": { "context": 4096, "output": 4096 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false + }, + "attachment": false, + "open_weights": true, + "knowledge": "2023-08", + "release_date": "2023-11-01", + "last_updated": "2023-11-01", + "cost": { + "input": 1.5, + "output": 2 } }, { - "id": "qwen/qwen3-embedding-0.6b", - "name": "qwen/qwen3-embedding-0.6b", - "display_name": "qwen/qwen3-embedding-0.6b", + "id": "us.anthropic.claude-haiku-4-5-20251001-v1:0", + "name": "Claude Haiku 4.5 (US)", + "display_name": "Claude Haiku 4.5 (US)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 200000, + "output": 64000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "embedding" + "attachment": true, + "open_weights": false, + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", + "cost": { + "input": 1, + "output": 5, + "cache_read": 0.1, + "cache_write": 1.25 + } }, { - "id": "qwen/qwen3-embedding-4b", - "name": "qwen/qwen3-embedding-4b", - "display_name": "qwen/qwen3-embedding-4b", + "id": "anthropic.claude-opus-4-20250514-v1:0", + "name": "Claude Opus 4", + "display_name": "Claude Opus 4", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 200000, + "output": 32000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "embedding" + "attachment": true, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", + "cost": { + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 + } }, { - "id": "qwen/qwen3-embedding-8b", - "name": "qwen/qwen3-embedding-8b", - "display_name": "qwen/qwen3-embedding-8b", + "id": "mistral.voxtral-mini-3b-2507", + "name": "Voxtral Mini 3B 2507", + "display_name": "Voxtral Mini 3B 2507", "modalities": { "input": [ + "audio", "text" ], "output": [ @@ -67994,83 +68261,112 @@ ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 128000, + "output": 4096 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "type": "embedding" + "attachment": false, + "open_weights": false, + "release_date": "2024-12-01", + "last_updated": "2024-12-01", + "cost": { + "input": 0.04, + "output": 0.04 + } }, { - "id": "qwen/qwen3-next-80b-a3b-instruct", - "name": "Qwen: Qwen3 Next 80B A3B Instruct", - "display_name": "Qwen: Qwen3 Next 80B A3B Instruct", + "id": "global.anthropic.claude-sonnet-4-5-20250929-v1:0", + "name": "Claude Sonnet 4.5 (Global)", + "display_name": "Claude Sonnet 4.5 (Global)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 200000, + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-09-11", - "last_updated": "2025-09-11", - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", + "cost": { + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 + } }, { - "id": "qwen/qwen3-next-80b-a3b-thinking", - "name": "Qwen: Qwen3 Next 80B A3B Thinking", - "display_name": "Qwen: Qwen3 Next 80B A3B Thinking", + "id": "global.anthropic.claude-opus-4-5-20251101-v1:0", + "name": "Claude Opus 4.5 (Global)", + "display_name": "Claude Opus 4.5 (Global)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144 + "context": 200000, + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-11-24", + "last_updated": "2025-08-01", + "cost": { + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 + } }, { - "id": "qwen/qwen3-omni-30b-a3b-instruct", - "name": "Qwen: Qwen3 VL 30B A3B Instruct", - "display_name": "Qwen: Qwen3 VL 30B A3B Instruct", + "id": "amazon.nova-2-lite-v1:0", + "name": "Nova 2 Lite", + "display_name": "Nova 2 Lite", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -68078,91 +68374,62 @@ "supported": false }, "attachment": false, - "type": "chat" + "open_weights": false, + "release_date": "2024-12-01", + "last_updated": "2024-12-01", + "cost": { + "input": 0.33, + "output": 2.75 + } }, { - "id": "qwen/qwen3-omni-30b-a3b-thinking", - "name": "Qwen: Qwen3 VL 30B A3B Thinking", - "display_name": "Qwen: Qwen3 VL 30B A3B Thinking", + "id": "qwen.qwen3-coder-480b-a35b-v1:0", + "name": "Qwen3 Coder 480B A35B Instruct", + "display_name": "Qwen3 Coder 480B A35B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 131072, + "output": 65536 }, "temperature": true, "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "attachment": false, - "type": "chat" - }, - { - "id": "qwen/qwen3-reranker-0.6b", - "name": "qwen/qwen3-reranker-0.6b", - "display_name": "qwen/qwen3-reranker-0.6b", - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "type": "rerank" - }, - { - "id": "qwen/qwen3-reranker-4b", - "name": "qwen/qwen3-reranker-4b", - "display_name": "qwen/qwen3-reranker-4b", - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "type": "rerank" - }, - { - "id": "qwen/qwen3-reranker-8b", - "name": "qwen/qwen3-reranker-8b", - "display_name": "qwen/qwen3-reranker-8b", - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, "reasoning": { "supported": false }, - "type": "rerank" + "attachment": false, + "open_weights": true, + "knowledge": "2024-04", + "release_date": "2025-09-18", + "last_updated": "2025-09-18", + "cost": { + "input": 0.22, + "output": 1.8 + } }, { - "id": "qwen/qwen3-vl-235b-a22b-instruct", - "name": "Qwen: Qwen3 VL 235B A22B Instruct", - "display_name": "Qwen: Qwen3 VL 235B A22B Instruct", + "id": "anthropic.claude-sonnet-4-5-20250929-v1:0", + "name": "Claude Sonnet 4.5", + "display_name": "Claude Sonnet 4.5", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -68170,51 +68437,63 @@ "supported": true, "default": true }, - "attachment": false, - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", + "cost": { + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 + } }, { - "id": "qwen/qwen3-vl-235b-a22b-thinking", - "name": "Qwen: Qwen3 VL 235B A22B Thinking", - "display_name": "Qwen: Qwen3 VL 235B A22B Thinking", + "id": "openai.gpt-oss-safeguard-20b", + "name": "GPT OSS Safeguard 20B", + "display_name": "GPT OSS Safeguard 20B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 65536, - "output": 65536 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "type": "chat" + "open_weights": false, + "release_date": "2024-12-01", + "last_updated": "2024-12-01", + "cost": { + "input": 0.07, + "output": 0.2 + } }, { - "id": "qwen/qwen3-vl-30b-a3b-instruct", - "name": "Qwen: Qwen3 VL 30B A3B Instruct", - "display_name": "Qwen: Qwen3 VL 30B A3B Instruct", + "id": "openai.gpt-oss-20b-1:0", + "name": "gpt-oss-20b", + "display_name": "gpt-oss-20b", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -68222,38 +68501,49 @@ "supported": false }, "attachment": false, - "type": "chat" + "open_weights": false, + "release_date": "2024-12-01", + "last_updated": "2024-12-01", + "cost": { + "input": 0.07, + "output": 0.3 + } }, { - "id": "qwen/qwen3-vl-30b-a3b-thinking", - "name": "Qwen: Qwen3 VL 30B A3B Thinking", - "display_name": "Qwen: Qwen3 VL 30B A3B Thinking", + "id": "meta.llama3-2-3b-instruct-v1:0", + "name": "Llama 3.2 3B Instruct", + "display_name": "Llama 3.2 3B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 131000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "type": "chat" + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-09-25", + "last_updated": "2024-09-25", + "cost": { + "input": 0.15, + "output": 0.15 + } }, { - "id": "tencent/hunyuan-mt-7b", - "name": "Tencent: Hunyuan A13B Instruct", - "display_name": "Tencent: Hunyuan A13B Instruct", + "id": "anthropic.claude-instant-v1", + "name": "Claude Instant", + "display_name": "Claude Instant", "modalities": { "input": [ "text" @@ -68263,45 +68553,62 @@ ] }, "limit": { - "context": 32768 + "context": 100000, + "output": 4096 }, - "temperature": false, + "temperature": true, "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "type": "chat" + "open_weights": false, + "knowledge": "2023-08", + "release_date": "2023-03-01", + "last_updated": "2023-03-01", + "cost": { + "input": 0.8, + "output": 2.4 + } }, { - "id": "x-ai/grok-2-image", - "name": "grok-2", - "display_name": "grok-2", + "id": "amazon.nova-premier-v1:0", + "name": "Nova Premier", + "display_name": "Nova Premier", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ - "text", - "image" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 1000000, + "output": 16384 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2024-10", + "release_date": "2024-12-03", + "last_updated": "2024-12-03", + "cost": { + "input": 2.5, + "output": 12.5 + } }, { - "id": "x-ai/grok-3", - "name": "xAI: Grok 3", - "display_name": "xAI: Grok 3", + "id": "mistral.mistral-7b-instruct-v0:2", + "name": "Mistral-7B-Instruct-v0.3", + "display_name": "Mistral-7B-Instruct-v0.3", "modalities": { "input": [ "text" @@ -68311,57 +68618,65 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 127000, + "output": 127000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-11", - "release_date": "2025-02-17", - "last_updated": "2025-02-17", - "type": "chat" + "open_weights": true, + "release_date": "2025-04-01", + "last_updated": "2025-04-01", + "cost": { + "input": 0.11, + "output": 0.11 + } }, { - "id": "x-ai/grok-3-mini", - "name": "xAI: Grok 3 Mini", - "display_name": "xAI: Grok 3 Mini", + "id": "eu.anthropic.claude-sonnet-4-20250514-v1:0", + "name": "Claude Sonnet 4 (EU)", + "display_name": "Claude Sonnet 4 (EU)", "modalities": { "input": [ - "text" - ], + "text", + "image", + "pdf" + ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 200000, + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-11", - "release_date": "2025-02-17", - "last_updated": "2025-02-17", - "type": "chat" + "knowledge": "2024-04", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", + "cost": { + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 + } }, { - "id": "x-ai/grok-4", - "name": "xAI: Grok 4", - "display_name": "xAI: Grok 4", + "id": "mistral.mixtral-8x7b-instruct-v0:1", + "name": "Mixtral-8x7B-Instruct-v0.1", + "display_name": "Mixtral-8x7B-Instruct-v0.1", "modalities": { "input": [ - "image", "text" ], "output": [ @@ -68369,54 +68684,95 @@ ] }, "limit": { - "context": 256000, - "output": 64000 + "context": 32000, + "output": 32000 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-07-09", - "last_updated": "2025-07-09", - "type": "chat" + "open_weights": true, + "release_date": "2025-04-01", + "last_updated": "2025-04-01", + "cost": { + "input": 0.7, + "output": 0.7 + } }, { - "id": "x-ai/grok-4-fast-non-reasoning", - "name": "x-ai/grok-4-fast-non-reasoning", - "display_name": "x-ai/grok-4-fast-non-reasoning", + "id": "anthropic.claude-opus-4-1-20250805-v1:0", + "name": "Claude Opus 4.1", + "display_name": "Claude Opus 4.1", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, "limit": { - "context": 2000000, - "output": 2000000 + "context": 200000, + "output": 32000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "cost": { + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 + } }, { - "id": "x-ai/grok-4-fast-reasoning", - "name": "x-ai/grok-4-fast-reasoning", - "display_name": "x-ai/grok-4-fast-reasoning", + "id": "meta.llama4-scout-17b-instruct-v1:0", + "name": "Llama 4 Scout 17B Instruct", + "display_name": "Llama 4 Scout 17B Instruct", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, "limit": { - "context": 2000000, - "output": 2000000 + "context": 3500000, + "output": 16384 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "type": "chat" + "attachment": true, + "open_weights": true, + "knowledge": "2024-08", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", + "cost": { + "input": 0.17, + "output": 0.66 + } }, { - "id": "x-ai/grok-code-fast-1", - "name": "xAI: Grok Code Fast 1", - "display_name": "xAI: Grok Code Fast 1", + "id": "ai21.jamba-1-5-mini-v1:0", + "name": "Jamba 1.5 Mini", + "display_name": "Jamba 1.5 Mini", "modalities": { "input": [ "text" @@ -68427,25 +68783,27 @@ }, "limit": { "context": 256000, - "output": 10000 + "output": 4096 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2025-08", - "release_date": "2025-08-26", - "last_updated": "2025-08-26", - "type": "chat" + "open_weights": true, + "knowledge": "2024-08", + "release_date": "2024-08-15", + "last_updated": "2024-08-15", + "cost": { + "input": 0.2, + "output": 0.4 + } }, { - "id": "z-ai/glm-4.5", - "name": "Z.AI: GLM 4.5", - "display_name": "Z.AI: GLM 4.5", + "id": "meta.llama3-8b-instruct-v1:0", + "name": "Llama 3 8B Instruct", + "display_name": "Llama 3 8B Instruct", "modalities": { "input": [ "text" @@ -68455,26 +68813,28 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 8192, + "output": 2048 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", - "type": "chat" + "knowledge": "2023-03", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", + "cost": { + "input": 0.3, + "output": 0.6 + } }, { - "id": "z-ai/glm-4.5-flash", - "name": "z-ai/glm-4.5-flash", - "display_name": "z-ai/glm-4.5-flash", + "id": "amazon.titan-text-express-v1:0:8k", + "name": "Titan Text G1 - Express", + "display_name": "Titan Text G1 - Express", "modalities": { "input": [ "text" @@ -68484,49 +68844,60 @@ ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 128000, + "output": 4096 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "type": "chat" + "attachment": false, + "open_weights": false, + "release_date": "2024-12-01", + "last_updated": "2024-12-01", + "cost": { + "input": 0.2, + "output": 0.6 + } }, { - "id": "z-ai/glm-4.5v", - "name": "Z.AI: GLM 4.5V", - "display_name": "Z.AI: GLM 4.5V", + "id": "anthropic.claude-3-sonnet-20240229-v1:0", + "name": "Claude Sonnet 3", + "display_name": "Claude Sonnet 3", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 65536, - "output": 16384 + "context": 200000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-08-11", - "last_updated": "2025-08-11", - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2023-08", + "release_date": "2024-03-04", + "last_updated": "2024-03-04", + "cost": { + "input": 3, + "output": 15 + } }, { - "id": "z-ai/glm-4.6", - "name": "Z.AI: GLM 4.6", - "display_name": "Z.AI: GLM 4.6", + "id": "nvidia.nemotron-nano-9b-v2", + "name": "NVIDIA Nemotron Nano 9B v2", + "display_name": "NVIDIA Nemotron Nano 9B v2", "modalities": { "input": [ "text" @@ -68536,29 +68907,32 @@ ] }, "limit": { - "context": 202752, - "output": 202752 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-09", - "release_date": "2025-09-30", - "last_updated": "2025-09-30", - "type": "chat" + "open_weights": false, + "release_date": "2024-12-01", + "last_updated": "2024-12-01", + "cost": { + "input": 0.06, + "output": 0.23 + } }, { - "id": "z-ai/glm-4.7", - "name": "Z.AI: GLM 4.7", - "display_name": "Z.AI: GLM 4.7", + "id": "eu.anthropic.claude-sonnet-4-5-20250929-v1:0", + "name": "Claude Sonnet 4.5 (EU)", + "display_name": "Claude Sonnet 4.5 (EU)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" @@ -68566,7 +68940,7 @@ }, "limit": { "context": 200000, - "output": 200000 + "output": 64000 }, "temperature": true, "tool_call": true, @@ -68574,19 +68948,22 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": true, + "attachment": true, + "open_weights": false, + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 0.273974, - "output": 1.095896, - "cache_read": 0.054795 - }, - "type": "chat" + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 + } }, { - "id": "xiaomi/mimo-v2-flash", - "name": "Xiaomi: Mimo V2 Flash", - "display_name": "Xiaomi: Mimo V2 Flash", + "id": "amazon.titan-text-express-v1", + "name": "Titan Text G1 - Express", + "display_name": "Titan Text G1 - Express", "modalities": { "input": [ "text" @@ -68596,57 +68973,59 @@ ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 128000, + "output": 4096 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, + "release_date": "2024-12-01", + "last_updated": "2024-12-01", "cost": { - "input": 0.1918, - "output": 0.5754, - "cache_read": 0.03836 - }, - "type": "chat" + "input": 0.2, + "output": 0.6 + } }, { - "id": "xiaomimimo/mimo-v2-flash", - "name": "Xiaomi: Mimo V2 Flash", - "display_name": "Xiaomi: Mimo V2 Flash", + "id": "meta.llama4-maverick-17b-instruct-v1:0", + "name": "Llama 4 Maverick 17B Instruct", + "display_name": "Llama 4 Maverick 17B Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 1000000, + "output": 16384 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, + "attachment": true, + "open_weights": true, + "knowledge": "2024-08", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", "cost": { - "input": 0.1918, - "output": 0.5754, - "cache_read": 0.03836 - }, - "type": "chat" + "input": 0.24, + "output": 0.97 + } }, { - "id": "minimax/minimax-m2.1", - "name": "MiniMax: minimax-m2.1", - "display_name": "MiniMax: minimax-m2.1", + "id": "mistral.ministral-3-14b-instruct", + "name": "Ministral 14B 3.0", + "display_name": "Ministral 14B 3.0", "modalities": { "input": [ "text" @@ -68656,26 +69035,27 @@ ] }, "limit": { - "context": 204800, - "output": 204800 + "context": 128000, + "output": 4096 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, + "release_date": "2024-12-01", + "last_updated": "2024-12-01", "cost": { - "input": 0.288, - "output": 1.152 - }, - "type": "chat" + "input": 0.2, + "output": 0.2 + } }, { - "id": "minimax/minimax-m2.1-lightning", - "name": "MiniMax: minimax-m2.1-lightning", - "display_name": "MiniMax: minimax-m2.1-lightning", + "id": "openai.gpt-oss-safeguard-120b", + "name": "GPT OSS Safeguard 120B", + "display_name": "GPT OSS Safeguard 120B", "modalities": { "input": [ "text" @@ -68685,1242 +69065,12459 @@ ] }, "limit": { - "context": 204800, - "output": 204800 + "context": 128000, + "output": 4096 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, + "release_date": "2024-12-01", + "last_updated": "2024-12-01", "cost": { - "input": 0.144, - "output": 0.576 - }, - "type": "chat" - } - ] - }, - "doubao": { - "id": "doubao", - "name": "Doubao", - "display_name": "Doubao", - "models": [ + "input": 0.15, + "output": 0.6 + } + }, { - "id": "deepseek-v3-1-250821", - "name": "DeepSeek V3.1", - "display_name": "DeepSeek V3.1", + "id": "qwen.qwen3-235b-a22b-2507-v1:0", + "name": "Qwen3 235B A22B 2507", + "display_name": "Qwen3 235B A22B 2507", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, "limit": { - "context": 128000, - "output": 32000 + "context": 262144, + "output": 131072 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "type": "chat" + "attachment": false, + "open_weights": true, + "knowledge": "2024-04", + "release_date": "2025-09-18", + "last_updated": "2025-09-18", + "cost": { + "input": 0.22, + "output": 0.88 + } }, { - "id": "deepseek-r1-250120", - "name": "DeepSeek R1", - "display_name": "DeepSeek R1", - "limit": { - "context": 64000, - "output": 4096 - }, - "tool_call": false, - "reasoning": { - "supported": true, - "default": true + "id": "us.anthropic.claude-opus-4-20250514-v1:0", + "name": "Claude Opus 4 (US)", + "display_name": "Claude Opus 4 (US)", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] }, - "type": "chat" - }, - { - "id": "deepseek-r1-distill-qwen-32b-250120", - "name": "DeepSeek R1 Distill Qwen 32B", - "display_name": "DeepSeek R1 Distill Qwen 32B", "limit": { - "context": 32000, - "output": 4096 + "context": 200000, + "output": 32000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", + "cost": { + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 + } }, { - "id": "deepseek-r1-distill-qwen-7b-250120", - "name": "DeepSeek R1 Distill Qwen 7B", - "display_name": "DeepSeek R1 Distill Qwen 7B", - "limit": { - "context": 32000, - "output": 4096 - }, - "tool_call": false, - "reasoning": { - "supported": true, - "default": true + "id": "amazon.nova-lite-v1:0", + "name": "Nova Lite", + "display_name": "Nova Lite", + "modalities": { + "input": [ + "text", + "image", + "video" + ], + "output": [ + "text" + ] }, - "type": "chat" - }, - { - "id": "deepseek-v3-250324", - "name": "DeepSeek V3", - "display_name": "DeepSeek V3", "limit": { - "context": 64000, - "output": 4096 + "context": 300000, + "output": 8192 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2024-10", + "release_date": "2024-12-03", + "last_updated": "2024-12-03", + "cost": { + "input": 0.06, + "output": 0.24, + "cache_read": 0.015 + } }, { - "id": "doubao-seed-1-6-vision-250815", - "name": "Doubao Seed 1.6 Vision", - "display_name": "Doubao Seed 1.6 Vision", - "limit": { - "context": 256000, - "output": 32000 - }, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true + "id": "anthropic.claude-3-5-haiku-20241022-v1:0", + "name": "Claude Haiku 3.5", + "display_name": "Claude Haiku 3.5", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] }, - "type": "chat" - }, - { - "id": "doubao-seed-1-6-250615", - "name": "Doubao Seed 1.6", - "display_name": "Doubao Seed 1.6", "limit": { - "context": 256000, - "output": 32000 + "context": 200000, + "output": 8192 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2024-07", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", + "cost": { + "input": 0.8, + "output": 4, + "cache_read": 0.08, + "cache_write": 1 + } }, { - "id": "doubao-seed-1-6-flash-250715", - "name": "Doubao Seed 1.6 Flash", - "display_name": "Doubao Seed 1.6 Flash", - "limit": { - "context": 256000, - "output": 32000 - }, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true + "id": "moonshot.kimi-k2-thinking", + "name": "Kimi K2 Thinking", + "display_name": "Kimi K2 Thinking", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] }, - "type": "chat" - }, - { - "id": "doubao-seed-1-6-flash-250615", - "name": "Doubao Seed 1.6 Flash (250615)", - "display_name": "Doubao Seed 1.6 Flash (250615)", "limit": { "context": 256000, - "output": 32000 + "output": 256000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "type": "chat" + "attachment": false, + "open_weights": true, + "release_date": "2025-12-02", + "last_updated": "2025-12-02", + "cost": { + "input": 0.6, + "output": 2.5 + } }, { - "id": "doubao-seed-1-6-thinking-250715", - "name": "Doubao Seed 1.6 Thinking", - "display_name": "Doubao Seed 1.6 Thinking", + "id": "eu.anthropic.claude-opus-4-5-20251101-v1:0", + "name": "Claude Opus 4.5 (EU)", + "display_name": "Claude Opus 4.5 (EU)", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, "limit": { - "context": 256000, - "output": 32000 + "context": 200000, + "output": 64000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-11-24", + "last_updated": "2025-08-01", + "cost": { + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 + } }, { - "id": "doubao-seed-1-6-thinking-250615", - "name": "Doubao Seed 1.6 Thinking (250615)", - "display_name": "Doubao Seed 1.6 Thinking (250615)", + "id": "eu.anthropic.claude-opus-4-6-v1", + "name": "Claude Opus 4.6 (EU)", + "display_name": "Claude Opus 4.6 (EU)", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, "limit": { - "context": 256000, - "output": 32000 + "context": 1000000, + "output": 128000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "type": "chat" + "attachment": true, + "open_weights": false, + "knowledge": "2025-05", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", + "cost": { + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25, + "context_over_200k": { + "input": 10, + "output": 37.5, + "cache_read": 1, + "cache_write": 12.5 + } + } } ] }, - "ppinfra": { - "id": "ppinfra", - "name": "PPInfra", - "display_name": "PPInfra", + "poe": { + "id": "poe", + "name": "Poe", + "display_name": "Poe", + "api": "https://api.poe.com/v1", + "doc": "https://creator.poe.com/docs/external-applications/openai-compatible-api", "models": [ { - "id": "zai-org/autoglm-phone-9b-multilingual", - "name": "AutoGLM-Phone-9B-Multilingual", - "display_name": "AutoGLM-Phone-9B-Multilingual", + "id": "xai/grok-4-fast-non-reasoning", + "name": "Grok-4-Fast-Non-Reasoning", + "display_name": "Grok-4-Fast-Non-Reasoning", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, "limit": { - "context": 65536, - "output": 32000 + "context": 2000000, + "output": 128000 }, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { "supported": false }, - "type": "chat" + "attachment": true, + "open_weights": false, + "release_date": "2025-09-16", + "last_updated": "2025-09-16", + "cost": { + "input": 0.2, + "output": 0.5, + "cache_read": 0.05 + } }, { - "id": "baichuan/baichuan-m2-32b", - "name": "BaiChuan M2 32B", - "display_name": "BaiChuan M2 32B", + "id": "xai/grok-4-fast-reasoning", + "name": "Grok 4 Fast Reasoning", + "display_name": "Grok 4 Fast Reasoning", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, "limit": { - "context": 131072, - "output": 131072 + "context": 2000000, + "output": 128000 }, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "type": "chat" + "attachment": true, + "open_weights": false, + "release_date": "2025-09-16", + "last_updated": "2025-09-16", + "cost": { + "input": 0.2, + "output": 0.5, + "cache_read": 0.05 + } }, { - "id": "deepseek/deepseek-prover-v2-671b", - "name": "Deepseek Prover V2 671B", - "display_name": "Deepseek Prover V2 671B", - "limit": { - "context": 160000, - "output": 160000 - }, - "tool_call": false, - "reasoning": { - "supported": false + "id": "xai/grok-4.1-fast-reasoning", + "name": "Grok-4.1-Fast-Reasoning", + "display_name": "Grok-4.1-Fast-Reasoning", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] }, - "type": "chat" - }, - { - "id": "deepseek/deepseek-r1/community", - "name": "DeepSeek R1 (Community)", - "display_name": "DeepSeek R1 (Community)", "limit": { - "context": 64000, - "output": 4000 + "context": 2000000, + "output": 30000 }, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "type": "chat" + "attachment": true, + "open_weights": false, + "release_date": "2025-11-19", + "last_updated": "2025-11-19" }, { - "id": "deepseek/deepseek-r1-turbo", - "name": "DeepSeek R1 (Turbo)", - "display_name": "DeepSeek R1 (Turbo)", + "id": "xai/grok-4", + "name": "Grok 4", + "display_name": "Grok 4", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, "limit": { - "context": 64000, - "output": 16000 + "context": 256000, + "output": 128000 }, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "type": "chat" + "attachment": true, + "open_weights": false, + "release_date": "2025-07-10", + "last_updated": "2025-07-10", + "cost": { + "input": 3, + "output": 15, + "cache_read": 0.75 + } }, { - "id": "deepseek/deepseek-r1-distill-llama-70b", - "name": "DeepSeek R1 Distill Llama 70B", - "display_name": "DeepSeek R1 Distill Llama 70B", + "id": "xai/grok-code-fast-1", + "name": "Grok Code Fast 1", + "display_name": "Grok Code Fast 1", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, "limit": { - "context": 32000, - "output": 8000 + "context": 256000, + "output": 128000 }, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "type": "chat" + "attachment": true, + "open_weights": false, + "release_date": "2025-08-22", + "last_updated": "2025-08-22", + "cost": { + "input": 0.2, + "output": 1.5, + "cache_read": 0.02 + } }, { - "id": "deepseek/deepseek-v3/community", - "name": "DeepSeek V3 (Community)", - "display_name": "DeepSeek V3 (Community)", - "limit": { - "context": 64000, - "output": 4000 - }, - "tool_call": true, - "reasoning": { - "supported": false + "id": "xai/grok-4.1-fast-non-reasoning", + "name": "Grok-4.1-Fast-Non-Reasoning", + "display_name": "Grok-4.1-Fast-Non-Reasoning", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] }, - "type": "chat" - }, - { - "id": "deepseek/deepseek-v3-turbo", - "name": "DeepSeek V3 (Turbo)", - "display_name": "DeepSeek V3 (Turbo)", "limit": { - "context": 64000, - "output": 16000 + "context": 2000000, + "output": 30000 }, + "temperature": false, "tool_call": true, "reasoning": { "supported": false }, - "type": "chat" + "attachment": true, + "open_weights": false, + "release_date": "2025-11-19", + "last_updated": "2025-11-19" }, { - "id": "deepseek/deepseek-v3-0324", - "name": "DeepSeek V3 0324", - "display_name": "DeepSeek V3 0324", + "id": "xai/grok-3", + "name": "Grok 3", + "display_name": "Grok 3", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, "limit": { - "context": 163840, - "output": 163840 + "context": 131072, + "output": 8192 }, + "temperature": false, "tool_call": true, "reasoning": { "supported": false }, - "type": "chat" + "attachment": true, + "open_weights": false, + "release_date": "2025-04-11", + "last_updated": "2025-04-11", + "cost": { + "input": 3, + "output": 15, + "cache_read": 0.75 + } }, { - "id": "deepseek/deepseek-v3.1", - "name": "Deepseek V3.1", - "display_name": "Deepseek V3.1", + "id": "xai/grok-3-mini", + "name": "Grok 3 Mini", + "display_name": "Grok 3 Mini", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, "limit": { "context": 131072, - "output": 32768 + "output": 8192 }, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "type": "chat" + "attachment": true, + "open_weights": false, + "release_date": "2025-04-11", + "last_updated": "2025-04-11", + "cost": { + "input": 0.3, + "output": 0.5, + "cache_read": 0.075 + } }, { - "id": "deepseek/deepseek-v3.1-terminus", - "name": "Deepseek V3.1 Terminus", - "display_name": "Deepseek V3.1 Terminus", + "id": "ideogramai/ideogram", + "name": "Ideogram", + "display_name": "Ideogram", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "image" + ] + }, "limit": { - "context": 131072, - "output": 65536 + "context": 150, + "output": 0 }, + "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "type": "chat" + "attachment": true, + "open_weights": false, + "release_date": "2024-04-03", + "last_updated": "2024-04-03" }, { - "id": "deepseek/deepseek-v3.2", - "name": "Deepseek V3.2", - "display_name": "Deepseek V3.2", + "id": "ideogramai/ideogram-v2a", + "name": "Ideogram-v2a", + "display_name": "Ideogram-v2a", + "modalities": { + "input": [ + "text" + ], + "output": [ + "image" + ] + }, "limit": { - "context": 163840, - "output": 65536 + "context": 150, + "output": 0 }, + "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "type": "chat" + "attachment": true, + "open_weights": false, + "release_date": "2025-02-27", + "last_updated": "2025-02-27" }, { - "id": "deepseek/deepseek-v3.2-exp", - "name": "Deepseek V3.2 Exp", - "display_name": "Deepseek V3.2 Exp", + "id": "ideogramai/ideogram-v2a-turbo", + "name": "Ideogram-v2a-Turbo", + "display_name": "Ideogram-v2a-Turbo", + "modalities": { + "input": [ + "text" + ], + "output": [ + "image" + ] + }, "limit": { - "context": 163840, - "output": 65536 + "context": 150, + "output": 0 }, + "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "type": "chat" + "attachment": true, + "open_weights": false, + "release_date": "2025-02-27", + "last_updated": "2025-02-27" }, { - "id": "deepseek/deepseek-ocr", - "name": "DeepSeek-OCR", - "display_name": "DeepSeek-OCR", + "id": "ideogramai/ideogram-v2", + "name": "Ideogram-v2", + "display_name": "Ideogram-v2", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "image" + ] + }, "limit": { - "context": 8192, - "output": 8192 + "context": 150, + "output": 0 }, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { "supported": false }, - "type": "chat" + "attachment": true, + "open_weights": false, + "release_date": "2024-08-21", + "last_updated": "2024-08-21" }, { - "id": "deepseek/deepseek-r1-0528-qwen3-8b", - "name": "DeepSeek-R1-0528-Qwen3-8B", - "display_name": "DeepSeek-R1-0528-Qwen3-8B", - "limit": { - "context": 128000, - "output": 32000 - }, - "tool_call": false, - "reasoning": { - "supported": true, - "default": true + "id": "runwayml/runway", + "name": "Runway", + "display_name": "Runway", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "video" + ] }, - "type": "chat" - }, - { - "id": "deepseek/deepseek-r1-distill-qwen-14b", - "name": "DeepSeek: DeepSeek R1 Distill Qwen 14B", - "display_name": "DeepSeek: DeepSeek R1 Distill Qwen 14B", "limit": { - "context": 64000, - "output": 8000 + "context": 256, + "output": 0 }, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "type": "chat" + "attachment": true, + "open_weights": false, + "release_date": "2024-10-11", + "last_updated": "2024-10-11" }, { - "id": "deepseek/deepseek-r1-distill-qwen-32b", - "name": "DeepSeek: DeepSeek R1 Distill Qwen 32B", - "display_name": "DeepSeek: DeepSeek R1 Distill Qwen 32B", - "limit": { - "context": 64000, - "output": 8000 - }, - "tool_call": false, - "reasoning": { - "supported": true, - "default": true + "id": "runwayml/runway-gen-4-turbo", + "name": "Runway-Gen-4-Turbo", + "display_name": "Runway-Gen-4-Turbo", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "video" + ] }, - "type": "chat" - }, - { - "id": "deepseek/deepseek-r1-0528", - "name": "deepseek/deepseek-r1-0528", - "display_name": "deepseek/deepseek-r1-0528", "limit": { - "context": 163840, - "output": 32768 + "context": 256, + "output": 0 }, + "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "type": "chat" + "attachment": true, + "open_weights": false, + "release_date": "2025-05-09", + "last_updated": "2025-05-09" }, { - "id": "baidu/ernie-4.5-21b-a3b-thinking", - "name": "Ernie 4.5 21B A3B Thinking", - "display_name": "Ernie 4.5 21B A3B Thinking", + "id": "poetools/claude-code", + "name": "claude-code", + "display_name": "claude-code", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, "limit": { - "context": 131072, - "output": 65536 + "context": 0, + "output": 0 }, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "type": "chat" + "attachment": true, + "open_weights": false, + "release_date": "2025-11-27", + "last_updated": "2025-11-27" }, { - "id": "baidu/ernie-4.5-0.3b", - "name": "ERNIE-4.5-0.3B", - "display_name": "ERNIE-4.5-0.3B", + "id": "elevenlabs/elevenlabs-v3", + "name": "ElevenLabs-v3", + "display_name": "ElevenLabs-v3", + "modalities": { + "input": [ + "text" + ], + "output": [ + "audio" + ] + }, "limit": { - "context": 120000, - "output": 8000 + "context": 128000, + "output": 0 }, + "temperature": false, "tool_call": true, "reasoning": { "supported": false }, - "type": "chat" + "attachment": true, + "open_weights": false, + "release_date": "2025-06-05", + "last_updated": "2025-06-05" }, { - "id": "baidu/ernie-4.5-21B-a3b", - "name": "ERNIE-4.5-21B-A3B", - "display_name": "ERNIE-4.5-21B-A3B", + "id": "elevenlabs/elevenlabs-music", + "name": "ElevenLabs-Music", + "display_name": "ElevenLabs-Music", + "modalities": { + "input": [ + "text" + ], + "output": [ + "audio" + ] + }, "limit": { - "context": 120000, - "output": 8000 + "context": 2000, + "output": 0 }, + "temperature": false, "tool_call": true, "reasoning": { "supported": false }, - "type": "chat" + "attachment": true, + "open_weights": false, + "release_date": "2025-08-29", + "last_updated": "2025-08-29" }, { - "id": "baidu/ernie-4.5-300b-a47b-paddle", - "name": "ERNIE-4.5-300B-A47B", - "display_name": "ERNIE-4.5-300B-A47B", + "id": "elevenlabs/elevenlabs-v2.5-turbo", + "name": "ElevenLabs-v2.5-Turbo", + "display_name": "ElevenLabs-v2.5-Turbo", + "modalities": { + "input": [ + "text" + ], + "output": [ + "audio" + ] + }, "limit": { - "context": 123000, - "output": 12000 + "context": 128000, + "output": 0 }, + "temperature": false, "tool_call": true, "reasoning": { "supported": false }, - "type": "chat" + "attachment": true, + "open_weights": false, + "release_date": "2024-10-28", + "last_updated": "2024-10-28" }, { - "id": "baidu/ernie-4.5-vl-28b-a3b", - "name": "ERNIE-4.5-VL-28B-A3B", - "display_name": "ERNIE-4.5-VL-28B-A3B", - "limit": { - "context": 30000, - "output": 8000 - }, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true + "id": "google/gemini-deep-research", + "name": "gemini-deep-research", + "display_name": "gemini-deep-research", + "modalities": { + "input": [ + "text", + "image", + "video" + ], + "output": [ + "text" + ] }, - "type": "chat" - }, - { - "id": "baidu/ernie-4.5-vl-424b-a47b", - "name": "ERNIE-4.5-VL-424B-A47B", - "display_name": "ERNIE-4.5-VL-424B-A47B", "limit": { - "context": 123000, - "output": 16000 + "context": 1048576, + "output": 0 }, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "type": "chat" + "attachment": true, + "open_weights": false, + "release_date": "2025-12-11", + "last_updated": "2025-12-11", + "cost": { + "input": 1.6, + "output": 9.6 + } }, { - "id": "zai-org/glm-4.5v", - "name": "GLM 4.5V", - "display_name": "GLM 4.5V", + "id": "google/nano-banana", + "name": "Nano-Banana", + "display_name": "Nano-Banana", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text", + "image" + ] + }, "limit": { "context": 65536, - "output": 16384 + "output": 0 }, + "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "type": "chat" + "attachment": true, + "open_weights": false, + "release_date": "2025-08-21", + "last_updated": "2025-08-21", + "cost": { + "input": 0.21, + "output": 1.8, + "cache_read": 0.021 + } }, { - "id": "zai-org/glm-4.6", - "name": "GLM 4.6", - "display_name": "GLM 4.6", + "id": "google/imagen-4", + "name": "Imagen-4", + "display_name": "Imagen-4", + "modalities": { + "input": [ + "text" + ], + "output": [ + "image" + ] + }, "limit": { - "context": 204800, - "output": 131072 + "context": 480, + "output": 0 }, + "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "type": "chat" + "attachment": true, + "open_weights": false, + "release_date": "2025-05-22", + "last_updated": "2025-05-22" }, { - "id": "zai-org/glm-4.6v", - "name": "GLM 4.6v", - "display_name": "GLM 4.6v", + "id": "google/imagen-3", + "name": "Imagen-3", + "display_name": "Imagen-3", + "modalities": { + "input": [ + "text" + ], + "output": [ + "image" + ] + }, "limit": { - "context": 131072, - "output": 32768 + "context": 480, + "output": 0 }, + "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "type": "chat" + "attachment": true, + "open_weights": false, + "release_date": "2024-10-15", + "last_updated": "2024-10-15" }, { - "id": "zai-org/glm-4.5", - "name": "GLM-4.5", - "display_name": "GLM-4.5", + "id": "google/imagen-4-ultra", + "name": "Imagen-4-Ultra", + "display_name": "Imagen-4-Ultra", + "modalities": { + "input": [ + "text" + ], + "output": [ + "image" + ] + }, "limit": { - "context": 131072, - "output": 98304 + "context": 480, + "output": 0 }, + "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "type": "chat" + "attachment": true, + "open_weights": false, + "release_date": "2025-05-24", + "last_updated": "2025-05-24" }, { - "id": "zai-org/glm-4.7", - "name": "GLM-4.7", - "display_name": "GLM-4.7", + "id": "google/gemini-2.5-flash", + "name": "Gemini 2.5 Flash", + "display_name": "Gemini 2.5 Flash", + "modalities": { + "input": [ + "text", + "image", + "video", + "audio" + ], + "output": [ + "text" + ] + }, "limit": { - "context": 204800, - "output": 131072 + "context": 1065535, + "output": 65535 }, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "type": "chat" + "attachment": true, + "open_weights": false, + "release_date": "2025-04-26", + "last_updated": "2025-04-26", + "cost": { + "input": 0.21, + "output": 1.8, + "cache_read": 0.021 + } }, { - "id": "kat-coder", - "name": "KAT Coder Pro V1", - "display_name": "KAT Coder Pro V1", + "id": "google/gemini-2.0-flash-lite", + "name": "Gemini-2.0-Flash-Lite", + "display_name": "Gemini-2.0-Flash-Lite", + "modalities": { + "input": [ + "text", + "image", + "video", + "audio" + ], + "output": [ + "text" + ] + }, "limit": { - "context": 256000, - "output": 128000 + "context": 990000, + "output": 8192 }, + "temperature": false, "tool_call": true, "reasoning": { "supported": false }, - "type": "chat" + "attachment": true, + "open_weights": false, + "release_date": "2025-02-05", + "last_updated": "2025-02-05", + "cost": { + "input": 0.052, + "output": 0.21 + } }, { - "id": "moonshotai/kimi-k2-0905", - "name": "Kimi K2 0905", - "display_name": "Kimi K2 0905", + "id": "google/gemini-3-pro", + "name": "Gemini-3-Pro", + "display_name": "Gemini-3-Pro", + "modalities": { + "input": [ + "text", + "image", + "video", + "audio" + ], + "output": [ + "text" + ] + }, "limit": { - "context": 262144, - "output": 262144 + "context": 1048576, + "output": 64000 }, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" + "attachment": true, + "open_weights": false, + "release_date": "2025-10-22", + "last_updated": "2025-10-22", + "cost": { + "input": 1.6, + "output": 9.6, + "cache_read": 0.16 + } }, { - "id": "moonshotai/kimi-k2-instruct", - "name": "Kimi K2 Instruct", - "display_name": "Kimi K2 Instruct", + "id": "google/veo-3.1", + "name": "Veo-3.1", + "display_name": "Veo-3.1", + "modalities": { + "input": [ + "text" + ], + "output": [ + "video" + ] + }, "limit": { - "context": 131072, - "output": 128000 + "context": 480, + "output": 0 }, + "temperature": false, "tool_call": true, "reasoning": { "supported": false }, - "type": "chat" + "attachment": true, + "open_weights": false, + "release_date": "2025-10-15", + "last_updated": "2025-10-15" }, { - "id": "moonshotai/kimi-k2-thinking", - "name": "Kimi K2 Thinking", - "display_name": "Kimi K2 Thinking", + "id": "google/imagen-3-fast", + "name": "Imagen-3-Fast", + "display_name": "Imagen-3-Fast", + "modalities": { + "input": [ + "text" + ], + "output": [ + "image" + ] + }, "limit": { - "context": 262144, - "output": 262144 + "context": 480, + "output": 0 }, + "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "type": "chat" + "attachment": true, + "open_weights": false, + "release_date": "2024-10-17", + "last_updated": "2024-10-17" }, { - "id": "minimax/minimax-m2.1", - "name": "MiniMax M2.1", - "display_name": "MiniMax M2.1", + "id": "google/lyria", + "name": "Lyria", + "display_name": "Lyria", + "modalities": { + "input": [ + "text" + ], + "output": [ + "audio" + ] + }, "limit": { - "context": 204800, - "output": 131072 + "context": 0, + "output": 0 }, + "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "type": "chat" + "attachment": true, + "open_weights": false, + "release_date": "2025-06-04", + "last_updated": "2025-06-04" }, { - "id": "minimax/minimax-m2", - "name": "MiniMax-M2", - "display_name": "MiniMax-M2", + "id": "google/gemini-2.0-flash", + "name": "Gemini-2.0-Flash", + "display_name": "Gemini-2.0-Flash", + "modalities": { + "input": [ + "text", + "image", + "video", + "audio" + ], + "output": [ + "text" + ] + }, "limit": { - "context": 204800, - "output": 131072 + "context": 990000, + "output": 8192 }, + "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "type": "chat" - }, + "attachment": true, + "open_weights": false, + "release_date": "2024-12-11", + "last_updated": "2024-12-11", + "cost": { + "input": 0.1, + "output": 0.42 + } + }, { - "id": "minimaxai/minimax-m1-80k", - "name": "MiniMaxAI/MiniMax-M1-80k", - "display_name": "MiniMaxAI/MiniMax-M1-80k", + "id": "google/gemini-2.5-flash-lite", + "name": "Gemini 2.5 Flash Lite", + "display_name": "Gemini 2.5 Flash Lite", + "modalities": { + "input": [ + "text", + "image", + "video", + "audio" + ], + "output": [ + "text" + ] + }, "limit": { - "context": 128000, - "output": 40000 + "context": 1024000, + "output": 64000 }, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "type": "chat" + "attachment": true, + "open_weights": false, + "release_date": "2025-06-19", + "last_updated": "2025-06-19", + "cost": { + "input": 0.07, + "output": 0.28 + } }, { - "id": "paddlepaddle/paddleocr-vl", - "name": "PaddleOCR-VL", - "display_name": "PaddleOCR-VL", + "id": "google/veo-3", + "name": "Veo-3", + "display_name": "Veo-3", + "modalities": { + "input": [ + "text" + ], + "output": [ + "video" + ] + }, "limit": { - "context": 16384, - "output": 16384 + "context": 480, + "output": 0 }, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { "supported": false }, - "type": "chat" + "attachment": true, + "open_weights": false, + "release_date": "2025-05-21", + "last_updated": "2025-05-21" }, { - "id": "qwen/qwen2.5-7b-instruct", - "name": "Qwen 2.5 7B Instruct", - "display_name": "Qwen 2.5 7B Instruct", + "id": "google/veo-3-fast", + "name": "Veo-3-Fast", + "display_name": "Veo-3-Fast", + "modalities": { + "input": [ + "text" + ], + "output": [ + "video" + ] + }, "limit": { - "context": 32000, - "output": 32000 + "context": 480, + "output": 0 }, + "temperature": false, "tool_call": true, "reasoning": { "supported": false }, - "type": "chat" + "attachment": true, + "open_weights": false, + "release_date": "2025-10-13", + "last_updated": "2025-10-13" }, { - "id": "qwen/qwen3-omni-30b-a3b-instruct", - "name": "qwen/qwen3-omni-30b-a3b-instruct", - "display_name": "qwen/qwen3-omni-30b-a3b-instruct", + "id": "google/imagen-4-fast", + "name": "Imagen-4-Fast", + "display_name": "Imagen-4-Fast", + "modalities": { + "input": [ + "text" + ], + "output": [ + "image" + ] + }, "limit": { - "context": 65536, - "output": 16384 + "context": 480, + "output": 0 }, + "temperature": false, "tool_call": true, "reasoning": { "supported": false }, - "type": "chat" + "attachment": true, + "open_weights": false, + "release_date": "2025-06-25", + "last_updated": "2025-06-25" }, { - "id": "qwen/qwen3-omni-30b-a3b-thinking", - "name": "qwen/qwen3-omni-30b-a3b-thinking", - "display_name": "qwen/qwen3-omni-30b-a3b-thinking", + "id": "google/veo-2", + "name": "Veo-2", + "display_name": "Veo-2", + "modalities": { + "input": [ + "text" + ], + "output": [ + "video" + ] + }, "limit": { - "context": 65536, - "output": 16384 + "context": 480, + "output": 0 }, + "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "type": "chat" + "attachment": true, + "open_weights": false, + "release_date": "2024-12-02", + "last_updated": "2024-12-02" }, { - "id": "qwen/qwen3-vl-30b-a3b-instruct", - "name": "qwen/qwen3-vl-30b-a3b-instruct", - "display_name": "qwen/qwen3-vl-30b-a3b-instruct", + "id": "google/gemini-3-flash", + "name": "gemini-3-flash", + "display_name": "gemini-3-flash", + "modalities": { + "input": [ + "text", + "image", + "video", + "audio" + ], + "output": [ + "text" + ] + }, "limit": { - "context": 131072, - "output": 32768 + "context": 1048576, + "output": 65536 }, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" + "attachment": true, + "open_weights": false, + "release_date": "2025-10-07", + "last_updated": "2025-10-07", + "cost": { + "input": 0.4, + "output": 2.4, + "cache_read": 0.04 + } }, { - "id": "qwen/qwen3-vl-30b-a3b-thinking", - "name": "qwen/qwen3-vl-30b-a3b-thinking", - "display_name": "qwen/qwen3-vl-30b-a3b-thinking", + "id": "google/nano-banana-pro", + "name": "Nano-Banana-Pro", + "display_name": "Nano-Banana-Pro", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "image" + ] + }, "limit": { - "context": 131072, - "output": 32768 + "context": 65536, + "output": 0 }, + "temperature": false, "tool_call": true, "reasoning": { "supported": false }, - "type": "chat" + "attachment": true, + "open_weights": false, + "release_date": "2025-11-19", + "last_updated": "2025-11-19", + "cost": { + "input": 2, + "output": 12, + "cache_read": 0.2 + } }, { - "id": "qwen/qwen3-vl-8b-instruct", - "name": "qwen/qwen3-vl-8b-instruct", - "display_name": "qwen/qwen3-vl-8b-instruct", + "id": "google/gemini-2.5-pro", + "name": "Gemini 2.5 Pro", + "display_name": "Gemini 2.5 Pro", + "modalities": { + "input": [ + "text", + "image", + "video", + "audio" + ], + "output": [ + "text" + ] + }, "limit": { - "context": 131072, - "output": 32768 + "context": 1065535, + "output": 65535 }, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" + "attachment": true, + "open_weights": false, + "release_date": "2025-02-05", + "last_updated": "2025-02-05", + "cost": { + "input": 0.87, + "output": 7, + "cache_read": 0.087 + } }, { - "id": "qwen/qwen-2.5-72b-instruct", - "name": "Qwen2.5 72B Instruct", - "display_name": "Qwen2.5 72B Instruct", + "id": "google/veo-3.1-fast", + "name": "Veo-3.1-Fast", + "display_name": "Veo-3.1-Fast", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "video" + ] + }, "limit": { - "context": 32000, - "output": 16000 + "context": 480, + "output": 0 }, + "temperature": false, "tool_call": true, "reasoning": { "supported": false }, - "type": "chat" + "attachment": true, + "open_weights": false, + "release_date": "2025-10-15", + "last_updated": "2025-10-15" }, { - "id": "qwen/qwen2.5-vl-72b-instruct", - "name": "Qwen2.5 VL 72B Instruct", - "display_name": "Qwen2.5 VL 72B Instruct", + "id": "openai/gpt-4.1-nano", + "name": "GPT-4.1-nano", + "display_name": "GPT-4.1-nano", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, "limit": { - "context": 32000, - "output": 32000 + "context": 1047576, + "output": 32768 }, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { "supported": false }, - "type": "chat" + "attachment": true, + "open_weights": false, + "release_date": "2025-04-15", + "last_updated": "2025-04-15", + "cost": { + "input": 0.09, + "output": 0.36, + "cache_read": 0.022 + } }, { - "id": "qwen/qwen3-235b-a22b-instruct-2507", - "name": "Qwen3 235B A22B Instruct 2507", - "display_name": "Qwen3 235B A22B Instruct 2507", + "id": "openai/gpt-5.2-instant", + "name": "gpt-5.2-instant", + "display_name": "gpt-5.2-instant", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, "limit": { - "context": 262144, - "output": 260000 + "context": 128000, + "output": 16384 }, + "temperature": false, "tool_call": true, "reasoning": { "supported": false }, - "type": "chat" + "attachment": true, + "open_weights": false, + "release_date": "2025-12-11", + "last_updated": "2025-12-11", + "cost": { + "input": 1.6, + "output": 13, + "cache_read": 0.16 + } }, { - "id": "qwen/qwen3-235b-a22b-thinking-2507", - "name": "Qwen3 235B A22b Thinking 2507", - "display_name": "Qwen3 235B A22b Thinking 2507", + "id": "openai/sora-2", + "name": "Sora-2", + "display_name": "Sora-2", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "video" + ] + }, "limit": { - "context": 131072, - "output": 114688 + "context": 0, + "output": 0 }, + "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "type": "chat" + "attachment": true, + "open_weights": false, + "release_date": "2025-10-06", + "last_updated": "2025-10-06" }, { - "id": "qwen/qwen3-32b-fp8", - "name": "Qwen3 32B", - "display_name": "Qwen3 32B", + "id": "openai/o1-pro", + "name": "o1-pro", + "display_name": "o1-pro", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, "limit": { - "context": 128000, - "output": 20000 + "context": 200000, + "output": 100000 }, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "type": "chat" + "attachment": true, + "open_weights": false, + "release_date": "2025-03-19", + "last_updated": "2025-03-19", + "cost": { + "input": 140, + "output": 540 + } }, { - "id": "qwen/qwen3-4b-fp8", - "name": "Qwen3 4B", - "display_name": "Qwen3 4B", + "id": "openai/gpt-5.2-codex", + "name": "gpt-5.2-codex", + "display_name": "gpt-5.2-codex", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, "limit": { - "context": 128000, - "output": 20000 + "context": 400000, + "output": 128000 }, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "type": "chat" + "attachment": true, + "open_weights": false, + "release_date": "2026-01-14", + "last_updated": "2026-01-14", + "cost": { + "input": 1.6, + "output": 13, + "cache_read": 0.16 + } }, { - "id": "qwen/qwen3-8b-fp8", - "name": "Qwen3 8B", - "display_name": "Qwen3 8B", + "id": "openai/gpt-5.1-codex", + "name": "GPT-5.1-Codex", + "display_name": "GPT-5.1-Codex", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, "limit": { - "context": 128000, - "output": 20000 + "context": 400000, + "output": 128000 }, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "type": "chat" + "attachment": true, + "open_weights": false, + "release_date": "2025-11-12", + "last_updated": "2025-11-12", + "cost": { + "input": 1.1, + "output": 9, + "cache_read": 0.11 + } }, { - "id": "qwen/qwen3-coder-30b-a3b-instruct", - "name": "Qwen3 Coder 30b A3B Instruct", - "display_name": "Qwen3 Coder 30b A3B Instruct", - "limit": { - "context": 262144, - "output": 65536 - }, - "tool_call": true, - "reasoning": { - "supported": false + "id": "openai/gpt-3.5-turbo-raw", + "name": "GPT-3.5-Turbo-Raw", + "display_name": "GPT-3.5-Turbo-Raw", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] }, - "type": "chat" - }, - { - "id": "qwen/qwen3-coder-480b-a35b-instruct", - "name": "Qwen3 Coder 480B A35B Instruct", - "display_name": "Qwen3 Coder 480B A35B Instruct", "limit": { - "context": 262144, - "output": 65536 + "context": 4524, + "output": 2048 }, + "temperature": false, "tool_call": true, "reasoning": { "supported": false }, - "type": "chat" + "attachment": true, + "open_weights": false, + "release_date": "2023-09-27", + "last_updated": "2023-09-27", + "cost": { + "input": 0.45, + "output": 1.4 + } }, { - "id": "qwen/qwen3-next-80b-a3b-instruct", - "name": "Qwen3 Next 80B A3B Instruct", - "display_name": "Qwen3 Next 80B A3B Instruct", + "id": "openai/gpt-4-classic", + "name": "GPT-4-Classic", + "display_name": "GPT-4-Classic", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, "limit": { - "context": 65536, - "output": 65536 + "context": 8192, + "output": 4096 }, + "temperature": false, "tool_call": true, "reasoning": { "supported": false }, - "type": "chat" + "attachment": true, + "open_weights": false, + "release_date": "2024-03-25", + "last_updated": "2024-03-25", + "cost": { + "input": 27, + "output": 54 + } }, { - "id": "qwen/qwen3-next-80b-a3b-thinking", - "name": "Qwen3 Next 80B A3B Thinking", - "display_name": "Qwen3 Next 80B A3B Thinking", + "id": "openai/gpt-4.1-mini", + "name": "GPT-4.1-mini", + "display_name": "GPT-4.1-mini", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1047576, + "output": 32768 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-04-15", + "last_updated": "2025-04-15", + "cost": { + "input": 0.36, + "output": 1.4, + "cache_read": 0.09 + } + }, + { + "id": "openai/gpt-5-chat", + "name": "GPT-5-Chat", + "display_name": "GPT-5-Chat", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-08-07", + "last_updated": "2025-08-07", + "cost": { + "input": 1.1, + "output": 9, + "cache_read": 0.11 + } + }, + { + "id": "openai/o3-deep-research", + "name": "o3-deep-research", + "display_name": "o3-deep-research", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 200000, + "output": 100000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-06-27", + "last_updated": "2025-06-27", + "cost": { + "input": 9, + "output": 36, + "cache_read": 2.2 + } + }, + { + "id": "openai/gpt-4o-search", + "name": "GPT-4o-Search", + "display_name": "GPT-4o-Search", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 8192 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-03-11", + "last_updated": "2025-03-11", + "cost": { + "input": 2.2, + "output": 9 + } + }, + { + "id": "openai/gpt-image-1.5", + "name": "gpt-image-1.5", + "display_name": "gpt-image-1.5", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "image" + ] + }, + "limit": { + "context": 128000, + "output": 0 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-12-16", + "last_updated": "2025-12-16" + }, + { + "id": "openai/gpt-image-1-mini", + "name": "GPT-Image-1-Mini", + "display_name": "GPT-Image-1-Mini", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "image" + ] + }, + "limit": { + "context": 0, + "output": 0 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-08-26", + "last_updated": "2025-08-26" + }, + { + "id": "openai/gpt-3.5-turbo", + "name": "GPT-3.5-Turbo", + "display_name": "GPT-3.5-Turbo", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 16384, + "output": 2048 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "release_date": "2023-09-13", + "last_updated": "2023-09-13", + "cost": { + "input": 0.45, + "output": 1.4 + } + }, + { + "id": "openai/gpt-5.2-pro", + "name": "gpt-5.2-pro", + "display_name": "gpt-5.2-pro", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 400000, + "output": 128000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-12-11", + "last_updated": "2025-12-11", + "cost": { + "input": 19, + "output": 150 + } + }, + { + "id": "openai/o3-mini-high", + "name": "o3-mini-high", + "display_name": "o3-mini-high", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 200000, + "output": 100000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-01-31", + "last_updated": "2025-01-31", + "cost": { + "input": 0.99, + "output": 4 + } + }, + { + "id": "openai/chatgpt-4o-latest", + "name": "ChatGPT-4o-Latest", + "display_name": "ChatGPT-4o-Latest", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 8192 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "release_date": "2024-08-14", + "last_updated": "2024-08-14", + "cost": { + "input": 4.5, + "output": 14 + } + }, + { + "id": "openai/gpt-4-turbo", + "name": "GPT-4-Turbo", + "display_name": "GPT-4-Turbo", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 4096 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "release_date": "2023-09-13", + "last_updated": "2023-09-13", + "cost": { + "input": 9, + "output": 27 + } + }, + { + "id": "openai/gpt-5.1-codex-mini", + "name": "GPT-5.1-Codex-Mini", + "display_name": "GPT-5.1-Codex-Mini", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 400000, + "output": 128000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-11-12", + "last_updated": "2025-11-12", + "cost": { + "input": 0.22, + "output": 1.8, + "cache_read": 0.022 + } + }, + { + "id": "openai/gpt-5.1-instant", + "name": "GPT-5.1-Instant", + "display_name": "GPT-5.1-Instant", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-11-12", + "last_updated": "2025-11-12", + "cost": { + "input": 1.1, + "output": 9, + "cache_read": 0.11 + } + }, + { + "id": "openai/o3-mini", + "name": "o3-mini", + "display_name": "o3-mini", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 200000, + "output": 100000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-01-31", + "last_updated": "2025-01-31", + "cost": { + "input": 0.99, + "output": 4 + } + }, + { + "id": "openai/gpt-5.1", + "name": "GPT-5.1", + "display_name": "GPT-5.1", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 400000, + "output": 128000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-11-12", + "last_updated": "2025-11-12", + "cost": { + "input": 1.1, + "output": 9, + "cache_read": 0.11 + } + }, + { + "id": "openai/gpt-5-nano", + "name": "GPT-5-nano", + "display_name": "GPT-5-nano", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 400000, + "output": 128000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "cost": { + "input": 0.045, + "output": 0.36, + "cache_read": 0.0045 + } + }, + { + "id": "openai/gpt-5-codex", + "name": "GPT-5-Codex", + "display_name": "GPT-5-Codex", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 400000, + "output": 128000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-09-23", + "last_updated": "2025-09-23", + "cost": { + "input": 1.1, + "output": 9 + } + }, + { + "id": "openai/gpt-4o", + "name": "GPT-4o", + "display_name": "GPT-4o", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 8192 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "release_date": "2024-05-13", + "last_updated": "2024-05-13" + }, + { + "id": "openai/gpt-4.1", + "name": "GPT-4.1", + "display_name": "GPT-4.1", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1047576, + "output": 32768 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-04-14", + "last_updated": "2025-04-14", + "cost": { + "input": 1.8, + "output": 7.2, + "cache_read": 0.45 + } + }, + { + "id": "openai/o4-mini", + "name": "o4-mini", + "display_name": "o4-mini", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 200000, + "output": 100000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-04-16", + "last_updated": "2025-04-16", + "cost": { + "input": 0.99, + "output": 4, + "cache_read": 0.25 + } + }, + { + "id": "openai/o1", + "name": "o1", + "display_name": "o1", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 200000, + "output": 100000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "release_date": "2024-12-18", + "last_updated": "2024-12-18", + "cost": { + "input": 14, + "output": 54 + } + }, + { + "id": "openai/gpt-5-mini", + "name": "GPT-5-mini", + "display_name": "GPT-5-mini", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 400000, + "output": 128000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-06-25", + "last_updated": "2025-06-25", + "cost": { + "input": 0.22, + "output": 1.8, + "cache_read": 0.022 + } + }, + { + "id": "openai/gpt-4o-aug", + "name": "GPT-4o-Aug", + "display_name": "GPT-4o-Aug", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 8192 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "release_date": "2024-11-21", + "last_updated": "2024-11-21", + "cost": { + "input": 2.2, + "output": 9, + "cache_read": 1.1 + } + }, + { + "id": "openai/o3-pro", + "name": "o3-pro", + "display_name": "o3-pro", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 200000, + "output": 100000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-06-10", + "last_updated": "2025-06-10", + "cost": { + "input": 18, + "output": 72 + } + }, + { + "id": "openai/gpt-image-1", + "name": "GPT-Image-1", + "display_name": "GPT-Image-1", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "image" + ] + }, + "limit": { + "context": 128000, + "output": 0 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-03-31", + "last_updated": "2025-03-31" + }, + { + "id": "openai/gpt-5.1-codex-max", + "name": "gpt-5.1-codex-max", + "display_name": "gpt-5.1-codex-max", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 400000, + "output": 128000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-12-08", + "last_updated": "2025-12-08", + "cost": { + "input": 1.1, + "output": 9, + "cache_read": 0.11 + } + }, + { + "id": "openai/gpt-3.5-turbo-instruct", + "name": "GPT-3.5-Turbo-Instruct", + "display_name": "GPT-3.5-Turbo-Instruct", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 3500, + "output": 1024 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "release_date": "2023-09-20", + "last_updated": "2023-09-20", + "cost": { + "input": 1.4, + "output": 1.8 + } + }, + { + "id": "openai/o3", + "name": "o3", + "display_name": "o3", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 200000, + "output": 100000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-04-16", + "last_updated": "2025-04-16", + "cost": { + "input": 1.8, + "output": 7.2, + "cache_read": 0.45 + } + }, + { + "id": "openai/o4-mini-deep-research", + "name": "o4-mini-deep-research", + "display_name": "o4-mini-deep-research", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 200000, + "output": 100000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-06-27", + "last_updated": "2025-06-27", + "cost": { + "input": 1.8, + "output": 7.2, + "cache_read": 0.45 + } + }, + { + "id": "openai/gpt-4-classic-0314", + "name": "GPT-4-Classic-0314", + "display_name": "GPT-4-Classic-0314", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 8192, + "output": 4096 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "release_date": "2024-08-26", + "last_updated": "2024-08-26", + "cost": { + "input": 27, + "output": 54 + } + }, + { + "id": "openai/gpt-4o-mini", + "name": "GPT-4o-mini", + "display_name": "GPT-4o-mini", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 4096 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "release_date": "2024-07-18", + "last_updated": "2024-07-18", + "cost": { + "input": 0.14, + "output": 0.54, + "cache_read": 0.068 + } + }, + { + "id": "openai/gpt-5", + "name": "GPT-5", + "display_name": "GPT-5", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 400000, + "output": 128000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "cost": { + "input": 1.1, + "output": 9, + "cache_read": 0.11 + } + }, + { + "id": "openai/dall-e-3", + "name": "DALL-E-3", + "display_name": "DALL-E-3", + "modalities": { + "input": [ + "text" + ], + "output": [ + "image" + ] + }, + "limit": { + "context": 800, + "output": 0 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "release_date": "2023-11-06", + "last_updated": "2023-11-06" + }, + { + "id": "openai/sora-2-pro", + "name": "Sora-2-Pro", + "display_name": "Sora-2-Pro", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "video" + ] + }, + "limit": { + "context": 0, + "output": 0 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-10-06", + "last_updated": "2025-10-06" + }, + { + "id": "openai/gpt-5-pro", + "name": "GPT-5-Pro", + "display_name": "GPT-5-Pro", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 400000, + "output": 128000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-10-06", + "last_updated": "2025-10-06", + "cost": { + "input": 14, + "output": 110 + } + }, + { + "id": "openai/gpt-5.2", + "name": "gpt-5.2", + "display_name": "gpt-5.2", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 400000, + "output": 128000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-12-08", + "last_updated": "2025-12-08", + "cost": { + "input": 1.6, + "output": 13, + "cache_read": 0.16 + } + }, + { + "id": "openai/gpt-4o-mini-search", + "name": "GPT-4o-mini-Search", + "display_name": "GPT-4o-mini-Search", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 8192 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-03-11", + "last_updated": "2025-03-11", + "cost": { + "input": 0.14, + "output": 0.54 + } + }, + { + "id": "stabilityai/stablediffusionxl", + "name": "StableDiffusionXL", + "display_name": "StableDiffusionXL", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "image" + ] + }, + "limit": { + "context": 200, + "output": 0 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "release_date": "2023-07-09", + "last_updated": "2023-07-09" + }, + { + "id": "topazlabs-co/topazlabs", + "name": "TopazLabs", + "display_name": "TopazLabs", + "modalities": { + "input": [ + "text" + ], + "output": [ + "image" + ] + }, + "limit": { + "context": 204, + "output": 0 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "release_date": "2024-12-03", + "last_updated": "2024-12-03" + }, + { + "id": "lumalabs/ray2", + "name": "Ray2", + "display_name": "Ray2", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "video" + ] + }, + "limit": { + "context": 5000, + "output": 0 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-02-20", + "last_updated": "2025-02-20" + }, + { + "id": "anthropic/claude-opus-4", + "name": "Claude Opus 4", + "display_name": "Claude Opus 4", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 192512, + "output": 32768 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-05-21", + "last_updated": "2025-05-21", + "cost": { + "input": 13, + "output": 64, + "cache_read": 1.3, + "cache_write": 16 + } + }, + { + "id": "anthropic/claude-sonnet-3.7", + "name": "Claude Sonnet 3.7", + "display_name": "Claude Sonnet 3.7", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 196608, + "output": 32768 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-02-19", + "last_updated": "2025-02-19", + "cost": { + "input": 2.6, + "output": 13, + "cache_read": 0.26, + "cache_write": 3.2 + } + }, + { + "id": "anthropic/claude-haiku-4.5", + "name": "Claude Haiku 4.5", + "display_name": "Claude Haiku 4.5", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 192000, + "output": 64000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-10-15", + "last_updated": "2025-10-15", + "cost": { + "input": 0.85, + "output": 4.3, + "cache_read": 0.085, + "cache_write": 1.1 + } + }, + { + "id": "anthropic/claude-opus-4-6", + "name": "claude-opus-4-6", + "display_name": "claude-opus-4-6", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 983040, + "output": 128000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "release_date": "2026-02-04", + "last_updated": "2026-02-04", + "cost": { + "input": 4.3, + "output": 21, + "cache_read": 0.43, + "cache_write": 5.3 + } + }, + { + "id": "anthropic/claude-haiku-3", + "name": "Claude-Haiku-3", + "display_name": "Claude-Haiku-3", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 189096, + "output": 8192 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "release_date": "2024-03-09", + "last_updated": "2024-03-09", + "cost": { + "input": 0.21, + "output": 1.1, + "cache_read": 0.021, + "cache_write": 0.26 + } + }, + { + "id": "anthropic/claude-opus-4.1", + "name": "Claude Opus 4.1", + "display_name": "Claude Opus 4.1", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 196608, + "output": 32000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "cost": { + "input": 13, + "output": 64, + "cache_read": 1.3, + "cache_write": 16 + } + }, + { + "id": "anthropic/claude-sonnet-3.5", + "name": "Claude-Sonnet-3.5", + "display_name": "Claude-Sonnet-3.5", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 189096, + "output": 8192 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "release_date": "2024-06-05", + "last_updated": "2024-06-05", + "cost": { + "input": 2.6, + "output": 13, + "cache_read": 0.26, + "cache_write": 3.2 + } + }, + { + "id": "anthropic/claude-sonnet-4", + "name": "Claude Sonnet 4", + "display_name": "Claude Sonnet 4", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 983040, + "output": 32768 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-05-21", + "last_updated": "2025-05-21", + "cost": { + "input": 2.6, + "output": 13, + "cache_read": 0.26, + "cache_write": 3.2 + } + }, + { + "id": "anthropic/claude-opus-4.5", + "name": "claude-opus-4.5", + "display_name": "claude-opus-4.5", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 196608, + "output": 64000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-11-21", + "last_updated": "2025-11-21", + "cost": { + "input": 4.3, + "output": 21, + "cache_read": 0.43, + "cache_write": 5.3 + } + }, + { + "id": "anthropic/claude-haiku-3.5", + "name": "Claude-Haiku-3.5", + "display_name": "Claude-Haiku-3.5", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 189096, + "output": 8192 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "release_date": "2024-10-01", + "last_updated": "2024-10-01", + "cost": { + "input": 0.68, + "output": 3.4, + "cache_read": 0.068, + "cache_write": 0.85 + } + }, + { + "id": "anthropic/claude-sonnet-3.5-june", + "name": "Claude-Sonnet-3.5-June", + "display_name": "Claude-Sonnet-3.5-June", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 189096, + "output": 8192 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "release_date": "2024-11-18", + "last_updated": "2024-11-18", + "cost": { + "input": 2.6, + "output": 13, + "cache_read": 0.26, + "cache_write": 3.2 + } + }, + { + "id": "anthropic/claude-sonnet-4.5", + "name": "Claude Sonnet 4.5", + "display_name": "Claude Sonnet 4.5", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 983040, + "output": 32768 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-09-26", + "last_updated": "2025-09-26", + "cost": { + "input": 2.6, + "output": 13, + "cache_read": 0.26, + "cache_write": 3.2 + } + }, + { + "id": "trytako/tako", + "name": "Tako", + "display_name": "Tako", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 2048, + "output": 0 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "release_date": "2024-08-15", + "last_updated": "2024-08-15" + }, + { + "id": "novita/glm-4.7", + "name": "glm-4.7", + "display_name": "glm-4.7", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 205000, + "output": 131072 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-12-22", + "last_updated": "2025-12-22" + }, + { + "id": "novita/kimi-k2.5", + "name": "kimi-k2.5", + "display_name": "kimi-k2.5", + "modalities": { + "input": [ + "text", + "image", + "video" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 256000, + "output": 262144 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "release_date": "2026-01-27", + "last_updated": "2026-01-27" + }, + { + "id": "novita/glm-4.7-flash", + "name": "glm-4.7-flash", + "display_name": "glm-4.7-flash", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 200000, + "output": 65500 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "release_date": "2026-01-19", + "last_updated": "2026-01-19" + }, + { + "id": "novita/kimi-k2-thinking", + "name": "kimi-k2-thinking", + "display_name": "kimi-k2-thinking", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 256000, + "output": 0 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-11-07", + "last_updated": "2025-11-07" + }, + { + "id": "novita/glm-4.6", + "name": "GLM-4.6", + "display_name": "GLM-4.6", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 0, + "output": 0 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-09-30", + "last_updated": "2025-09-30" + }, + { + "id": "novita/glm-4.7-n", + "name": "glm-4.7-n", + "display_name": "glm-4.7-n", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 205000, + "output": 131072 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-12-22", + "last_updated": "2025-12-22" + }, + { + "id": "novita/minimax-m2.1", + "name": "minimax-m2.1", + "display_name": "minimax-m2.1", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 205000, + "output": 131072 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-12-26", + "last_updated": "2025-12-26" + }, + { + "id": "novita/glm-4.6v", + "name": "glm-4.6v", + "display_name": "glm-4.6v", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131000, + "output": 32768 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-12-09", + "last_updated": "2025-12-09" + }, + { + "id": "cerebras/llama-3.1-8b-cs", + "name": "llama-3.1-8b-cs", + "display_name": "llama-3.1-8b-cs", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 0, + "output": 0 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-05-13", + "last_updated": "2025-05-13" + }, + { + "id": "cerebras/gpt-oss-120b-cs", + "name": "gpt-oss-120b-cs", + "display_name": "gpt-oss-120b-cs", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 0, + "output": 0 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-08-06", + "last_updated": "2025-08-06" + }, + { + "id": "cerebras/qwen3-235b-2507-cs", + "name": "qwen3-235b-2507-cs", + "display_name": "qwen3-235b-2507-cs", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 0, + "output": 0 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-08-06", + "last_updated": "2025-08-06" + }, + { + "id": "cerebras/qwen3-32b-cs", + "name": "qwen3-32b-cs", + "display_name": "qwen3-32b-cs", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 0, + "output": 0 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-05-15", + "last_updated": "2025-05-15" + }, + { + "id": "cerebras/llama-3.3-70b-cs", + "name": "llama-3.3-70b-cs", + "display_name": "llama-3.3-70b-cs", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 0, + "output": 0 + }, + "temperature": false, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-05-13", + "last_updated": "2025-05-13" + } + ] + }, + "minimax-cn-coding-plan": { + "id": "minimax-cn-coding-plan", + "name": "MiniMax Coding Plan (minimaxi.com)", + "display_name": "MiniMax Coding Plan (minimaxi.com)", + "api": "https://api.minimaxi.com/anthropic/v1", + "doc": "https://platform.minimaxi.com/docs/coding-plan/intro", + "models": [ + { + "id": "MiniMax-M2", + "name": "MiniMax-M2", + "display_name": "MiniMax-M2", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 196608, + "output": 128000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-10-27", + "last_updated": "2025-10-27", + "cost": { + "input": 0, + "output": 0 + } + }, + { + "id": "MiniMax-M2.1", + "name": "MiniMax-M2.1", + "display_name": "MiniMax-M2.1", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 204800, + "output": 131072 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-12-23", + "last_updated": "2025-12-23", + "cost": { + "input": 0, + "output": 0 + } + } + ] + }, + "cerebras": { + "id": "cerebras", + "name": "Cerebras", + "display_name": "Cerebras", + "doc": "https://inference-docs.cerebras.ai/models/overview", + "models": [ + { + "id": "zai-glm-4.7", + "name": "Z.AI GLM-4.7", + "display_name": "Z.AI GLM-4.7", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 40000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2026-01-10", + "last_updated": "2026-01-10", + "cost": { + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 + } + }, + { + "id": "qwen-3-235b-a22b-instruct-2507", + "name": "Qwen 3 235B Instruct", + "display_name": "Qwen 3 235B Instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131000, + "output": 32000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-22", + "last_updated": "2025-07-22", + "cost": { + "input": 0.6, + "output": 1.2 + } + }, + { + "id": "gpt-oss-120b", + "name": "GPT OSS 120B", + "display_name": "GPT OSS 120B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 32768 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "cost": { + "input": 0.25, + "output": 0.69 + } + } + ] + }, + "ollama": { + "id": "ollama", + "name": "Ollama Cloud", + "display_name": "Ollama Cloud", + "api": "https://ollama.com/v1", + "doc": "https://docs.ollama.com/cloud", + "models": [ + { + "id": "all-minilm:latest", + "name": "All-MiniLM Latest", + "display_name": "All-MiniLM Latest", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 512, + "output": 0 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "embedding" + }, + { + "id": "all-minilm:22m", + "name": "All-MiniLM 22M", + "display_name": "All-MiniLM 22M", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 512, + "output": 0 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "embedding" + }, + { + "id": "all-minilm:33m", + "name": "All-MiniLM 33M", + "display_name": "All-MiniLM 33M", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 512, + "output": 0 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "embedding" + }, + { + "id": "llava-llama3:latest", + "name": "LLaVA-Llama3 Latest", + "display_name": "LLaVA-Llama3 Latest", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 8000, + "output": 2000 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "llava-llama3:8b", + "name": "LLaVA-Llama3 8B", + "display_name": "LLaVA-Llama3 8B", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 8000, + "output": 2000 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "falcon3:latest", + "name": "Falcon3 Latest", + "display_name": "Falcon3 Latest", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 32000, + "output": 8000 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "falcon3:1b", + "name": "Falcon3 1B", + "display_name": "Falcon3 1B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 8000, + "output": 2000 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "falcon3:3b", + "name": "Falcon3 3B", + "display_name": "Falcon3 3B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 32000, + "output": 8000 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "falcon3:7b", + "name": "Falcon3 7B", + "display_name": "Falcon3 7B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 32000, + "output": 8000 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "falcon3:10b", + "name": "Falcon3 10B", + "display_name": "Falcon3 10B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 32000, + "output": 8000 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "snowflake-arctic-embed:latest", + "name": "Snowflake Arctic Embed Latest", + "display_name": "Snowflake Arctic Embed Latest", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 512, + "output": 0 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "embedding" + }, + { + "id": "snowflake-arctic-embed:22m", + "name": "Snowflake Arctic Embed 22M", + "display_name": "Snowflake Arctic Embed 22M", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 512, + "output": 0 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "embedding" + }, + { + "id": "snowflake-arctic-embed:33m", + "name": "Snowflake Arctic Embed 33M", + "display_name": "Snowflake Arctic Embed 33M", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 512, + "output": 0 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "embedding" + }, + { + "id": "snowflake-arctic-embed:110m", + "name": "Snowflake Arctic Embed 110M", + "display_name": "Snowflake Arctic Embed 110M", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 512, + "output": 0 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "embedding" + }, + { + "id": "snowflake-arctic-embed:137m", + "name": "Snowflake Arctic Embed 137M", + "display_name": "Snowflake Arctic Embed 137M", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 2000, + "output": 0 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "embedding" + }, + { + "id": "snowflake-arctic-embed:335m", + "name": "Snowflake Arctic Embed 335M", + "display_name": "Snowflake Arctic Embed 335M", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 512, + "output": 0 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "embedding" + }, + { + "id": "openthinker:latest", + "name": "OpenThinker Latest", + "display_name": "OpenThinker Latest", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 32000, + "output": 8000 + }, + "tool_call": false, + "reasoning": { + "supported": true, + "default": true + }, + "type": "chat" + }, + { + "id": "openthinker:7b", + "name": "OpenThinker 7B", + "display_name": "OpenThinker 7B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 32000, + "output": 8000 + }, + "tool_call": false, + "reasoning": { + "supported": true, + "default": true + }, + "type": "chat" + }, + { + "id": "openthinker:32b", + "name": "OpenThinker 32B", + "display_name": "OpenThinker 32B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 32000, + "output": 8000 + }, + "tool_call": false, + "reasoning": { + "supported": true, + "default": true + }, + "type": "chat" + }, + { + "id": "codestral:latest", + "name": "Codestral Latest", + "display_name": "Codestral Latest", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 32000, + "output": 8000 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "codestral:22b", + "name": "Codestral 22B", + "display_name": "Codestral 22B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 32000, + "output": 8000 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "granite4:latest", + "name": "Granite 4 Latest", + "display_name": "Granite 4 Latest", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 32000 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "granite4:350m", + "name": "Granite 4 350M", + "display_name": "Granite 4 350M", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 32000, + "output": 8000 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "granite4:1b", + "name": "Granite 4 1B", + "display_name": "Granite 4 1B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 32000 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "granite4:3b", + "name": "Granite 4 3B", + "display_name": "Granite 4 3B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 32000 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "moondream:latest", + "name": "Moondream Latest", + "display_name": "Moondream Latest", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 2000, + "output": 500 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "moondream:1.8b", + "name": "Moondream 1.8B", + "display_name": "Moondream 1.8B", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 2000, + "output": 500 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "granite-code:latest", + "name": "Granite Code Latest", + "display_name": "Granite Code Latest", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 125000, + "output": 31250 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "granite-code:3b", + "name": "Granite Code 3B", + "display_name": "Granite Code 3B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 125000, + "output": 31250 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "granite-code:8b", + "name": "Granite Code 8B", + "display_name": "Granite Code 8B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 125000, + "output": 31250 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "granite-code:20b", + "name": "Granite Code 20B", + "display_name": "Granite Code 20B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 8000, + "output": 2000 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "granite-code:34b", + "name": "Granite Code 34B", + "display_name": "Granite Code 34B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 8000, + "output": 2000 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "smollm:latest", + "name": "SmolLM Latest", + "display_name": "SmolLM Latest", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 32000, + "output": 8000 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "smollm:135m", + "name": "SmolLM 135M", + "display_name": "SmolLM 135M", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 32000, + "output": 8000 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "smollm:360m", + "name": "SmolLM 360M", + "display_name": "SmolLM 360M", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 32000, + "output": 8000 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "smollm:1.7b", + "name": "SmolLM 1.7B", + "display_name": "SmolLM 1.7B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 32000, + "output": 8000 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "phi:latest", + "name": "Phi Latest", + "display_name": "Phi Latest", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 2000, + "output": 500 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "phi:2.7b", + "name": "Phi 2.7B", + "display_name": "Phi 2.7B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 2000, + "output": 500 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "mistral-large:latest", + "name": "Mistral Large Latest", + "display_name": "Mistral Large Latest", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 32000 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "mistral-large:123b", + "name": "Mistral Large 123B", + "display_name": "Mistral Large 123B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 32000 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "zephyr:latest", + "name": "Zephyr Latest", + "display_name": "Zephyr Latest", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 32000, + "output": 8000 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "zephyr:7b", + "name": "Zephyr 7B", + "display_name": "Zephyr 7B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 32000, + "output": 8000 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "zephyr:141b", + "name": "Zephyr 141B", + "display_name": "Zephyr 141B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 32000, + "output": 8000 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "yi:latest", + "name": "Yi Latest", + "display_name": "Yi Latest", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 32000, + "output": 8000 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "yi:6b", + "name": "Yi 6B", + "display_name": "Yi 6B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 32000, + "output": 8000 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "yi:9b", + "name": "Yi 9B", + "display_name": "Yi 9B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 32000, + "output": 8000 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "yi:34b", + "name": "Yi 34B", + "display_name": "Yi 34B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 32000, + "output": 8000 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "embeddinggemma:latest", + "name": "EmbeddingGemma Latest", + "display_name": "EmbeddingGemma Latest", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 2000, + "output": 0 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "embedding" + }, + { + "id": "embeddinggemma:300m", + "name": "EmbeddingGemma 300M", + "display_name": "EmbeddingGemma 300M", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 2000, + "output": 0 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "embedding" + }, + { + "id": "gpt-oss-safeguard:latest", + "name": "GPT-OSS Safeguard Latest", + "display_name": "GPT-OSS Safeguard Latest", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 32768 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "type": "chat" + }, + { + "id": "gpt-oss-safeguard:20b", + "name": "GPT-OSS Safeguard 20B", + "display_name": "GPT-OSS Safeguard 20B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 32768 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "type": "chat" + }, + { + "id": "gpt-oss-safeguard:120b", + "name": "GPT-OSS Safeguard 120B", + "display_name": "GPT-OSS Safeguard 120B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 32768 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "type": "chat" + }, + { + "id": "minimax-m2:cloud", + "name": "MiniMax M2 Cloud", + "display_name": "MiniMax M2 Cloud", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 32000 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "type": "chat" + }, + { + "id": "cogito-2.1:cloud", + "name": "Cogito 2.1 Cloud", + "display_name": "Cogito 2.1 Cloud", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 32000 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "type": "chat" + }, + { + "id": "minimax-m2.1:cloud", + "name": "MiniMax M2.1 Cloud", + "display_name": "MiniMax M2.1 Cloud", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 32000 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "deepseek-ocr:latest", + "name": "DeepSeek OCR Latest", + "display_name": "DeepSeek OCR Latest", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 32000, + "output": 8000 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "deepseek-ocr:3b", + "name": "DeepSeek OCR 3B", + "display_name": "DeepSeek OCR 3B", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 32000, + "output": 8000 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "gemini-3-pro-preview:latest", + "name": "gemini-3-pro-preview", + "display_name": "gemini-3-pro-preview", + "modalities": { + "input": [ + "image", + "text", + "audio", + "video" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1048576, + "output": 65536 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "open_weights": false, + "knowledge": "2025-10", + "release_date": "2025-11-19", + "last_updated": "2025-11-19", + "type": "chat" + }, + { + "id": "gpt-oss:latest", + "name": "GPT-OSS Latest", + "display_name": "GPT-OSS Latest", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 32768 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "type": "chat" + }, + { + "id": "gpt-oss:20b", + "name": "gpt-oss:20b", + "display_name": "gpt-oss:20b", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 32768 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-08-05", + "last_updated": "2026-01-19", + "type": "chat" + }, + { + "id": "gpt-oss:120b", + "name": "gpt-oss:120b", + "display_name": "gpt-oss:120b", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 32768 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-08-05", + "last_updated": "2026-01-19", + "type": "chat" + }, + { + "id": "gpt-oss:20b-cloud", + "name": "GPT-OSS 20B Cloud", + "display_name": "GPT-OSS 20B Cloud", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 32768 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "type": "chat" + }, + { + "id": "gpt-oss:120b-cloud", + "name": "GPT-OSS 120B Cloud", + "display_name": "GPT-OSS 120B Cloud", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 32768 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "type": "chat" + }, + { + "id": "qwen3-vl:latest", + "name": "Qwen3-VL Latest", + "display_name": "Qwen3-VL Latest", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 256000, + "output": 65536 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "qwen3-vl:2b", + "name": "Qwen3-VL 2B", + "display_name": "Qwen3-VL 2B", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 256000, + "output": 65536 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "qwen3-vl:4b", + "name": "Qwen3-VL 4B", + "display_name": "Qwen3-VL 4B", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 256000, + "output": 65536 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "qwen3-vl:8b", + "name": "Qwen3-VL 8B", + "display_name": "Qwen3-VL 8B", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 256000, + "output": 65536 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "qwen3-vl:30b", + "name": "Qwen3-VL 30B", + "display_name": "Qwen3-VL 30B", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 256000, + "output": 65536 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "qwen3-vl:32b", + "name": "Qwen3-VL 32B", + "display_name": "Qwen3-VL 32B", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 256000, + "output": 65536 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "qwen3-vl:235b", + "name": "qwen3-vl:235b", + "display_name": "qwen3-vl:235b", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 32768 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": true, + "release_date": "2025-09-22", + "last_updated": "2026-01-19", + "type": "chat" + }, + { + "id": "qwen3-vl:235b-cloud", + "name": "Qwen3-VL 235B Cloud", + "display_name": "Qwen3-VL 235B Cloud", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 256000, + "output": 65536 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "qwen3-vl:235b-instruct-cloud", + "name": "Qwen3-VL 235B Instruct Cloud", + "display_name": "Qwen3-VL 235B Instruct Cloud", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 256000, + "output": 65536 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "deepseek-r1:latest", + "name": "DeepSeek-R1 Latest", + "display_name": "DeepSeek-R1 Latest", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 32768 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "type": "chat" + }, + { + "id": "deepseek-r1:1.5b", + "name": "DeepSeek-R1 1.5B", + "display_name": "DeepSeek-R1 1.5B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 32768 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "type": "chat" + }, + { + "id": "deepseek-r1:7b", + "name": "DeepSeek-R1 7B", + "display_name": "DeepSeek-R1 7B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 32768 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "type": "chat" + }, + { + "id": "deepseek-r1:8b", + "name": "DeepSeek-R1 8B", + "display_name": "DeepSeek-R1 8B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 32768 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "type": "chat" + }, + { + "id": "deepseek-r1:14b", + "name": "DeepSeek-R1 14B", + "display_name": "DeepSeek-R1 14B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 32768 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "type": "chat" + }, + { + "id": "deepseek-r1:32b", + "name": "DeepSeek-R1 32B", + "display_name": "DeepSeek-R1 32B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 32768 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "type": "chat" + }, + { + "id": "deepseek-r1:70b", + "name": "DeepSeek-R1 70B", + "display_name": "DeepSeek-R1 70B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 32768 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "type": "chat" + }, + { + "id": "deepseek-r1:671b", + "name": "DeepSeek-R1 671B", + "display_name": "DeepSeek-R1 671B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 160000, + "output": 40000 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "type": "chat" + }, + { + "id": "qwen3-coder:latest", + "name": "Qwen3-Coder Latest", + "display_name": "Qwen3-Coder Latest", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 256000, + "output": 65536 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "qwen3-coder:30b", + "name": "Qwen3-Coder 30B", + "display_name": "Qwen3-Coder 30B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 256000, + "output": 65536 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "qwen3-coder:480b", + "name": "qwen3-coder:480b", + "display_name": "qwen3-coder:480b", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 65536 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-07-22", + "last_updated": "2026-01-19", + "type": "chat" + }, + { + "id": "qwen3-coder:480b-cloud", + "name": "Qwen3-Coder 480B Cloud", + "display_name": "Qwen3-Coder 480B Cloud", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 256000, + "output": 65536 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "gemma3:latest", + "name": "Gemma3 Latest", + "display_name": "Gemma3 Latest", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 32768 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "gemma3:270m", + "name": "Gemma3 270M", + "display_name": "Gemma3 270M", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 32000, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "gemma3:1b", + "name": "Gemma3 1B", + "display_name": "Gemma3 1B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 32000, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "gemma3:4b", + "name": "gemma3:4b", + "display_name": "gemma3:4b", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 131072 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": true, + "release_date": "2024-12-01", + "last_updated": "2026-01-19", + "type": "chat" + }, + { + "id": "gemma3:12b", + "name": "gemma3:12b", + "display_name": "gemma3:12b", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 131072 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": true, + "release_date": "2024-12-01", + "last_updated": "2026-01-19", + "type": "chat" + }, + { + "id": "gemma3:27b", + "name": "gemma3:27b", + "display_name": "gemma3:27b", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 131072 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": true, + "release_date": "2025-07-27", + "last_updated": "2026-01-19", + "type": "chat" + }, + { + "id": "glm-4.6:cloud", + "name": "GLM-4.6 Cloud", + "display_name": "GLM-4.6 Cloud", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 198000, + "output": 49500 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "type": "chat" + }, + { + "id": "kimi-k2.5:cloud", + "name": "Kimi K2.5 Cloud", + "display_name": "Kimi K2.5 Cloud", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 256000, + "output": 64000 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "type": "chat" + }, + { + "id": "qwen3:latest", + "name": "Qwen3 Latest", + "display_name": "Qwen3 Latest", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 40000, + "output": 10000 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "type": "chat" + }, + { + "id": "qwen3:0.6b", + "name": "Qwen3 0.6B", + "display_name": "Qwen3 0.6B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 40000, + "output": 10000 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "type": "chat" + }, + { + "id": "qwen3:1.7b", + "name": "Qwen3 1.7B", + "display_name": "Qwen3 1.7B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 40000, + "output": 10000 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "type": "chat" + }, + { + "id": "qwen3:4b", + "name": "Qwen3 4B", + "display_name": "Qwen3 4B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 256000, + "output": 65536 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "type": "chat" + }, + { + "id": "qwen3:8b", + "name": "Qwen3 8B", + "display_name": "Qwen3 8B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 40000, + "output": 10000 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "type": "chat" + }, + { + "id": "qwen3:14b", + "name": "Qwen3 14B", + "display_name": "Qwen3 14B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 40000, + "output": 10000 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "type": "chat" + }, + { + "id": "qwen3:30b", + "name": "Qwen3 30B", + "display_name": "Qwen3 30B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 256000, + "output": 65536 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "type": "chat" + }, + { + "id": "qwen3:32b", + "name": "Qwen3 32B", + "display_name": "Qwen3 32B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 40000, + "output": 10000 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "type": "chat" + }, + { + "id": "qwen3:235b", + "name": "Qwen3 235B", + "display_name": "Qwen3 235B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 256000, + "output": 65536 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "type": "chat" + }, + { + "id": "deepseek-v3.1:latest", + "name": "DeepSeek-V3.1 Latest", + "display_name": "DeepSeek-V3.1 Latest", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 160000, + "output": 40000 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "type": "chat" + }, + { + "id": "deepseek-v3.1:671b", + "name": "deepseek-v3.1:671b", + "display_name": "deepseek-v3.1:671b", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 163840, + "output": 163840 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-08-21", + "last_updated": "2026-01-19", + "type": "chat" + }, + { + "id": "deepseek-v3.1:671b-cloud", + "name": "DeepSeek-V3.1 671B Cloud", + "display_name": "DeepSeek-V3.1 671B Cloud", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 160000, + "output": 40000 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "type": "chat" + }, + { + "id": "llama3.1:latest", + "name": "Llama 3.1 Latest", + "display_name": "Llama 3.1 Latest", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 32768 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "llama3.1:8b", + "name": "Llama 3.1 8B", + "display_name": "Llama 3.1 8B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 32768 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "llama3.1:70b", + "name": "Llama 3.1 70B", + "display_name": "Llama 3.1 70B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 32768 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "llama3.1:405b", + "name": "Llama 3.1 405B", + "display_name": "Llama 3.1 405B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 32768 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "llama3.2:latest", + "name": "Llama 3.2 Latest", + "display_name": "Llama 3.2 Latest", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 32768 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "llama3.2:1b", + "name": "Llama 3.2 1B", + "display_name": "Llama 3.2 1B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 32768 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "llama3.2:3b", + "name": "Llama 3.2 3B", + "display_name": "Llama 3.2 3B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 32768 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "phi3:latest", + "name": "Phi-3 Latest", + "display_name": "Phi-3 Latest", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 32768 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "phi3:3.8b", + "name": "Phi-3 3.8B", + "display_name": "Phi-3 3.8B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 32768 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "phi3:14b", + "name": "Phi-3 14B", + "display_name": "Phi-3 14B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 32768 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "mistral-nemo:latest", + "name": "Mistral-Nemo Latest", + "display_name": "Mistral-Nemo Latest", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1000000, + "output": 250000 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "mistral-nemo:12b", + "name": "Mistral-Nemo 12B", + "display_name": "Mistral-Nemo 12B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1000000, + "output": 250000 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "llava:latest", + "name": "LLaVA Latest", + "display_name": "LLaVA Latest", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 32000, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "llava:7b", + "name": "LLaVA 7B", + "display_name": "LLaVA 7B", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 32000, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "llava:13b", + "name": "LLaVA 13B", + "display_name": "LLaVA 13B", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 4000, + "output": 1000 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "llava:34b", + "name": "LLaVA 34B", + "display_name": "LLaVA 34B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 4000, + "output": 1000 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "codellama:latest", + "name": "CodeLlama Latest", + "display_name": "CodeLlama Latest", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 16000, + "output": 4000 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "codellama:7b", + "name": "CodeLlama 7B", + "display_name": "CodeLlama 7B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 16000, + "output": 4000 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "codellama:13b", + "name": "CodeLlama 13B", + "display_name": "CodeLlama 13B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 16000, + "output": 4000 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "codellama:34b", + "name": "CodeLlama 34B", + "display_name": "CodeLlama 34B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 16000, + "output": 4000 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "codellama:70b", + "name": "CodeLlama 70B", + "display_name": "CodeLlama 70B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 2000, + "output": 500 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "mixtral:latest", + "name": "Mixtral Latest", + "display_name": "Mixtral Latest", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 32000, + "output": 8192 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "mixtral:8x7b", + "name": "Mixtral 8x7B", + "display_name": "Mixtral 8x7B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 32000, + "output": 8192 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "mixtral:8x22b", + "name": "Mixtral 8x22B", + "display_name": "Mixtral 8x22B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 64000, + "output": 16000 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "deepseek-coder:latest", + "name": "DeepSeek-Coder Latest", + "display_name": "DeepSeek-Coder Latest", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 16000, + "output": 4000 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "deepseek-coder:1.3b", + "name": "DeepSeek-Coder 1.3B", + "display_name": "DeepSeek-Coder 1.3B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 16000, + "output": 4000 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "deepseek-coder:6.7b", + "name": "DeepSeek-Coder 6.7B", + "display_name": "DeepSeek-Coder 6.7B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 16000, + "output": 4000 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "deepseek-coder:33b", + "name": "DeepSeek-Coder 33B", + "display_name": "DeepSeek-Coder 33B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 16000, + "output": 4000 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "qwen2.5vl:latest", + "name": "Qwen2.5-VL Latest", + "display_name": "Qwen2.5-VL Latest", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 125000, + "output": 31250 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "qwen2.5vl:3b", + "name": "Qwen2.5-VL 3B", + "display_name": "Qwen2.5-VL 3B", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 125000, + "output": 31250 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "qwen2.5vl:7b", + "name": "Qwen2.5-VL 7B", + "display_name": "Qwen2.5-VL 7B", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 125000, + "output": 31250 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "qwen2.5vl:32b", + "name": "Qwen2.5-VL 32B", + "display_name": "Qwen2.5-VL 32B", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 125000, + "output": 31250 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "qwen2.5vl:72b", + "name": "Qwen2.5-VL 72B", + "display_name": "Qwen2.5-VL 72B", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 125000, + "output": 31250 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "nomic-embed-text:latest", + "name": "Nomic-Embed-Text Latest", + "display_name": "Nomic-Embed-Text Latest", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 2000, + "output": 0 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "embedding" + }, + { + "id": "nomic-embed-text:v1.5", + "name": "Nomic-Embed-Text v1.5", + "display_name": "Nomic-Embed-Text v1.5", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 2000, + "output": 0 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "embedding" + }, + { + "id": "nomic-embed-text:137m-v1.5-fp16", + "name": "Nomic-Embed-Text 137M v1.5 FP16", + "display_name": "Nomic-Embed-Text 137M v1.5 FP16", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 2000, + "output": 0 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "embedding" + }, + { + "id": "qwq:latest", + "name": "QwQ Latest", + "display_name": "QwQ Latest", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 40000, + "output": 10000 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "type": "chat" + }, + { + "id": "qwq:32b", + "name": "QwQ 32B", + "display_name": "QwQ 32B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 40000, + "output": 10000 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "type": "chat" + }, + { + "id": "mistral:latest", + "name": "Mistral Latest", + "display_name": "Mistral Latest", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 32000, + "output": 8192 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "mistral:7b", + "name": "Mistral 7B", + "display_name": "Mistral 7B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 32000, + "output": 8192 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "mistral-large-3:675b-cloud", + "name": "Mistral Large 3 675B Cloud", + "display_name": "Mistral Large 3 675B Cloud", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 256000, + "output": 256000 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "ministral-3:latest", + "name": "Ministral 3 Latest", + "display_name": "Ministral 3 Latest", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 256000, + "output": 256000 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "ministral-3:3b", + "name": "ministral-3:3b", + "display_name": "ministral-3:3b", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 128000 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": true, + "release_date": "2024-10-22", + "last_updated": "2026-01-19", + "type": "chat" + }, + { + "id": "ministral-3:8b", + "name": "ministral-3:8b", + "display_name": "ministral-3:8b", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 128000 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": true, + "release_date": "2024-12-01", + "last_updated": "2026-01-19", + "type": "chat" + }, + { + "id": "ministral-3:14b", + "name": "ministral-3:14b", + "display_name": "ministral-3:14b", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 128000 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": true, + "release_date": "2024-12-01", + "last_updated": "2026-01-19", + "type": "chat" + }, + { + "id": "ministral-3:3b-cloud", + "name": "Ministral 3 3B Cloud", + "display_name": "Ministral 3 3B Cloud", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 256000, + "output": 256000 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "ministral-3:8b-cloud", + "name": "Ministral 3 8B Cloud", + "display_name": "Ministral 3 8B Cloud", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 256000, + "output": 256000 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "ministral-3:14b-cloud", + "name": "Ministral 3 14B Cloud", + "display_name": "Ministral 3 14B Cloud", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 256000, + "output": 256000 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "ministral-3:3b-instruct-2512-q4_K_M", + "name": "Ministral 3 3B Instruct 2512 Q4_K_M", + "display_name": "Ministral 3 3B Instruct 2512 Q4_K_M", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 256000, + "output": 256000 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "ministral-3:3b-instruct-2512-q8_0", + "name": "Ministral 3 3B Instruct 2512 Q8_0", + "display_name": "Ministral 3 3B Instruct 2512 Q8_0", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 256000, + "output": 256000 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "ministral-3:3b-instruct-2512-fp16", + "name": "Ministral 3 3B Instruct 2512 FP16", + "display_name": "Ministral 3 3B Instruct 2512 FP16", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 256000, + "output": 256000 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "ministral-3:8b-instruct-2512-q4_K_M", + "name": "Ministral 3 8B Instruct 2512 Q4_K_M", + "display_name": "Ministral 3 8B Instruct 2512 Q4_K_M", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 256000, + "output": 256000 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "ministral-3:8b-instruct-2512-q8_0", + "name": "Ministral 3 8B Instruct 2512 Q8_0", + "display_name": "Ministral 3 8B Instruct 2512 Q8_0", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 256000, + "output": 256000 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "ministral-3:8b-instruct-2512-fp16", + "name": "Ministral 3 8B Instruct 2512 FP16", + "display_name": "Ministral 3 8B Instruct 2512 FP16", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 256000, + "output": 256000 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "ministral-3:14b-instruct-2512-q4_K_M", + "name": "Ministral 3 14B Instruct 2512 Q4_K_M", + "display_name": "Ministral 3 14B Instruct 2512 Q4_K_M", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 256000, + "output": 256000 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "ministral-3:14b-instruct-2512-q8_0", + "name": "Ministral 3 14B Instruct 2512 Q8_0", + "display_name": "Ministral 3 14B Instruct 2512 Q8_0", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 256000, + "output": 256000 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "ministral-3:14b-instruct-2512-fp16", + "name": "Ministral 3 14B Instruct 2512 FP16", + "display_name": "Ministral 3 14B Instruct 2512 FP16", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 256000, + "output": 256000 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "qwen2.5:latest", + "name": "Qwen2.5 Latest", + "display_name": "Qwen2.5 Latest", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 32768 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "qwen2.5:0.5b", + "name": "Qwen2.5 0.5B", + "display_name": "Qwen2.5 0.5B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 32768 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "qwen2.5:1.5b", + "name": "Qwen2.5 1.5B", + "display_name": "Qwen2.5 1.5B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 32768 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "qwen2.5:3b", + "name": "Qwen2.5 3B", + "display_name": "Qwen2.5 3B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 32768 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "qwen2.5:7b", + "name": "Qwen2.5 7B", + "display_name": "Qwen2.5 7B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 32768 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "qwen2.5:14b", + "name": "Qwen2.5 14B", + "display_name": "Qwen2.5 14B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 32768 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "qwen2.5:32b", + "name": "Qwen2.5 32B", + "display_name": "Qwen2.5 32B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 32768 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "qwen2.5:72b", + "name": "Qwen2.5 72B", + "display_name": "Qwen2.5 72B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 32768 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "llama3:latest", + "name": "Llama 3 Latest", + "display_name": "Llama 3 Latest", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 8000, + "output": 2000 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "llama3:8b", + "name": "Llama 3 8B", + "display_name": "Llama 3 8B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 8000, + "output": 2000 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "llama3:70b", + "name": "Llama 3 70B", + "display_name": "Llama 3 70B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 8000, + "output": 2000 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "gemma2:latest", + "name": "Gemma 2 Latest", + "display_name": "Gemma 2 Latest", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 8192, + "output": 2048 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "gemma2:2b", + "name": "Gemma 2 2B", + "display_name": "Gemma 2 2B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 8192, + "output": 2048 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "gemma2:9b", + "name": "Gemma 2 9B", + "display_name": "Gemma 2 9B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 8192, + "output": 2048 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "gemma2:27b", + "name": "Gemma 2 27B", + "display_name": "Gemma 2 27B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 8192, + "output": 2048 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "qwen2.5-coder:latest", + "name": "Qwen2.5-Coder Latest", + "display_name": "Qwen2.5-Coder Latest", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 32768 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "qwen2.5-coder:0.5b", + "name": "Qwen2.5-Coder 0.5B", + "display_name": "Qwen2.5-Coder 0.5B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 32768 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "qwen2.5-coder:1.5b", + "name": "Qwen2.5-Coder 1.5B", + "display_name": "Qwen2.5-Coder 1.5B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 32768 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "qwen2.5-coder:3b", + "name": "Qwen2.5-Coder 3B", + "display_name": "Qwen2.5-Coder 3B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 32768 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "qwen2.5-coder:7b", + "name": "Qwen2.5-Coder 7B", + "display_name": "Qwen2.5-Coder 7B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 32768 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "qwen2.5-coder:14b", + "name": "Qwen2.5-Coder 14B", + "display_name": "Qwen2.5-Coder 14B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 32768 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "qwen2.5-coder:32b", + "name": "Qwen2.5-Coder 32B", + "display_name": "Qwen2.5-Coder 32B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 32768 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "phi4:latest", + "name": "Phi-4 Latest", + "display_name": "Phi-4 Latest", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 16000, + "output": 4000 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "phi4:14b", + "name": "Phi-4 14B", + "display_name": "Phi-4 14B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 16000, + "output": 4000 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "gemma:latest", + "name": "Gemma Latest", + "display_name": "Gemma Latest", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 8192, + "output": 2048 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "gemma:2b", + "name": "Gemma 2B", + "display_name": "Gemma 2B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 8192, + "output": 2048 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "gemma:7b", + "name": "Gemma 7B", + "display_name": "Gemma 7B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 8192, + "output": 2048 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "llama2:latest", + "name": "Llama 2 Latest", + "display_name": "Llama 2 Latest", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 4096, + "output": 1024 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "llama2:7b", + "name": "Llama 2 7B", + "display_name": "Llama 2 7B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 4096, + "output": 1024 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "llama2:13b", + "name": "Llama 2 13B", + "display_name": "Llama 2 13B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 4096, + "output": 1024 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "llama2:70b", + "name": "Llama 2 70B", + "display_name": "Llama 2 70B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 4096, + "output": 1024 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "qwen2:latest", + "name": "Qwen2 Latest", + "display_name": "Qwen2 Latest", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 32768 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "qwen2:0.5b", + "name": "Qwen2 0.5B", + "display_name": "Qwen2 0.5B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 32768 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "qwen2:1.5b", + "name": "Qwen2 1.5B", + "display_name": "Qwen2 1.5B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 32768 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "qwen2:7b", + "name": "Qwen2 7B", + "display_name": "Qwen2 7B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 32768 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "qwen2:72b", + "name": "Qwen2 72B", + "display_name": "Qwen2 72B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 32768 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "deepseek-v3:latest", + "name": "DeepSeek-V3 Latest", + "display_name": "DeepSeek-V3 Latest", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 160000, + "output": 40000 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "type": "chat" + }, + { + "id": "deepseek-v3:671b", + "name": "DeepSeek-V3 671B", + "display_name": "DeepSeek-V3 671B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 160000, + "output": 40000 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "type": "chat" + }, + { + "id": "llama3.3:latest", + "name": "Llama 3.3 Latest", + "display_name": "Llama 3.3 Latest", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 32768 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "llama3.3:70b", + "name": "Llama 3.3 70B", + "display_name": "Llama 3.3 70B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 32768 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "bge-m3:latest", + "name": "BGE-M3 Latest", + "display_name": "BGE-M3 Latest", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 8192, + "output": 0 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "embedding" + }, + { + "id": "bge-m3:567m", + "name": "BGE-M3 567M", + "display_name": "BGE-M3 567M", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 8192, + "output": 0 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "embedding" + }, + { + "id": "llama3.2-vision:latest", + "name": "Llama 3.2 Vision Latest", + "display_name": "Llama 3.2 Vision Latest", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 32768 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "llama3.2-vision:11b", + "name": "Llama 3.2 Vision 11B", + "display_name": "Llama 3.2 Vision 11B", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 32768 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "llama3.2-vision:90b", + "name": "Llama 3.2 Vision 90B", + "display_name": "Llama 3.2 Vision 90B", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 32768 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "tinyllama:latest", + "name": "TinyLlama Latest", + "display_name": "TinyLlama Latest", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 2048, + "output": 512 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "tinyllama:1.1b", + "name": "TinyLlama 1.1B", + "display_name": "TinyLlama 1.1B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 2048, + "output": 512 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "starcoder2:latest", + "name": "StarCoder2 Latest", + "display_name": "StarCoder2 Latest", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 16384, + "output": 4096 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "starcoder2:3b", + "name": "StarCoder2 3B", + "display_name": "StarCoder2 3B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 16384, + "output": 4096 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "starcoder2:7b", + "name": "StarCoder2 7B", + "display_name": "StarCoder2 7B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 16384, + "output": 4096 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "starcoder2:15b", + "name": "StarCoder2 15B", + "display_name": "StarCoder2 15B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 16384, + "output": 4096 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "codegemma:latest", + "name": "CodeGemma Latest", + "display_name": "CodeGemma Latest", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 8192, + "output": 2048 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "codegemma:2b", + "name": "CodeGemma 2B", + "display_name": "CodeGemma 2B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 8192, + "output": 2048 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "codegemma:7b", + "name": "CodeGemma 7B", + "display_name": "CodeGemma 7B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 8192, + "output": 2048 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "glm-4.7", + "name": "glm-4.7", + "display_name": "glm-4.7", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 202752, + "output": 131072 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-12-22", + "last_updated": "2026-01-19" + }, + { + "id": "qwen3-next:80b", + "name": "qwen3-next:80b", + "display_name": "qwen3-next:80b", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 32768 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-09-15", + "last_updated": "2026-01-19" + }, + { + "id": "cogito-2.1:671b", + "name": "cogito-2.1:671b", + "display_name": "cogito-2.1:671b", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 163840, + "output": 32000 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-11-19", + "last_updated": "2026-01-19" + }, + { + "id": "gemini-3-flash-preview", + "name": "gemini-3-flash-preview", + "display_name": "gemini-3-flash-preview", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1048576, + "output": 65536 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2025-12-17", + "last_updated": "2026-01-19" + }, + { + "id": "gemini-3-pro-preview", + "name": "gemini-3-pro-preview", + "display_name": "gemini-3-pro-preview", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1048576, + "output": 64000 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": true, + "release_date": "2025-11-18", + "last_updated": "2026-01-19" + }, + { + "id": "qwen3-vl:235b-instruct", + "name": "qwen3-vl:235b-instruct", + "display_name": "qwen3-vl:235b-instruct", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 131072 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": true, + "release_date": "2025-09-22", + "last_updated": "2026-01-19" + }, + { + "id": "devstral-small-2:24b", + "name": "devstral-small-2:24b", + "display_name": "devstral-small-2:24b", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 262144 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": true, + "release_date": "2025-12-09", + "last_updated": "2026-01-19" + }, + { + "id": "kimi-k2.5", + "name": "kimi-k2.5", + "display_name": "kimi-k2.5", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 262144 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": true, + "release_date": "2026-01-27", + "last_updated": "2026-01-27" + }, + { + "id": "minimax-m2", + "name": "minimax-m2", + "display_name": "minimax-m2", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 204800, + "output": 128000 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-10-23", + "last_updated": "2026-01-19" + }, + { + "id": "kimi-k2-thinking", + "name": "kimi-k2-thinking", + "display_name": "kimi-k2-thinking", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 262144 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": true, + "knowledge": "2024-08", + "release_date": "2025-11-06", + "last_updated": "2026-01-19" + }, + { + "id": "rnj-1:8b", + "name": "rnj-1:8b", + "display_name": "rnj-1:8b", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 32768, + "output": 4096 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-12-06", + "last_updated": "2026-01-19" + }, + { + "id": "glm-4.6", + "name": "glm-4.6", + "display_name": "glm-4.6", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 202752, + "output": 131072 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-09-29", + "last_updated": "2026-01-19" + }, + { + "id": "kimi-k2:1t", + "name": "kimi-k2:1t", + "display_name": "kimi-k2:1t", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 262144 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2025-07-11", + "last_updated": "2026-01-19" + }, + { + "id": "devstral-2:123b", + "name": "devstral-2:123b", + "display_name": "devstral-2:123b", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 262144 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-12-09", + "last_updated": "2026-01-19" + }, + { + "id": "nemotron-3-nano:30b", + "name": "nemotron-3-nano:30b", + "display_name": "nemotron-3-nano:30b", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1048576, + "output": 131072 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-12-15", + "last_updated": "2026-01-19" + }, + { + "id": "mistral-large-3:675b", + "name": "mistral-large-3:675b", + "display_name": "mistral-large-3:675b", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 262144 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": true, + "release_date": "2025-12-02", + "last_updated": "2026-01-19" + }, + { + "id": "minimax-m2.1", + "name": "minimax-m2.1", + "display_name": "minimax-m2.1", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 204800, + "output": 131072 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-12-23", + "last_updated": "2026-01-19" + }, + { + "id": "deepseek-v3.2", + "name": "deepseek-v3.2", + "display_name": "deepseek-v3.2", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 163840, + "output": 65536 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-06-15", + "last_updated": "2026-01-19" + } + ] + }, + "burncloud": { + "id": "burncloud", + "name": "burncloud", + "display_name": "burncloud", + "models": [ + { + "id": "openai/gpt-4-turbo", + "name": "OpenAI GPT-4 Turbo", + "display_name": "GPT-4 Turbo", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "cost": { + "input": 8, + "output": 24 + }, + "type": "chat" + }, + { + "id": "openai/o4-mini", + "name": "OpenAI o4-mini", + "display_name": "o4-mini", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "output": 100000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "cost": { + "input": 0.88, + "output": 3.52 + }, + "type": "chat" + }, + { + "id": "openai/o3", + "name": "OpenAI o3", + "display_name": "o3", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "output": 100000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "cost": { + "input": 8, + "output": 35 + }, + "type": "chat" + }, + { + "id": "openai/o3-mini", + "name": "OpenAI o3-mini", + "display_name": "o3-mini", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "output": 100000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "cost": { + "input": 0.88, + "output": 3.52 + }, + "type": "chat" + }, + { + "id": "openai/o1", + "name": "OpenAI o1", + "display_name": "o1", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "output": 100000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "cost": { + "input": 12, + "output": 48 + }, + "type": "chat" + }, + { + "id": "openai/o1-mini", + "name": "OpenAI o1-mini", + "display_name": "o1-mini", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "output": 65536 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "cost": { + "input": 0.88, + "output": 3.52 + }, + "type": "chat" + }, + { + "id": "openai/o1-pro", + "name": "OpenAI o1-pro", + "display_name": "o1-pro", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "output": 100000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "cost": { + "input": 120, + "output": 480 + }, + "type": "chat" + }, + { + "id": "openai/gpt-4.1", + "name": "OpenAI GPT-4.1", + "display_name": "GPT-4.1", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "output": 32768 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "cost": { + "input": 1.6, + "output": 6.4 + }, + "type": "chat" + }, + { + "id": "openai/gpt-4o", + "name": "OpenAI GPT-4o", + "display_name": "GPT-4o", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "cost": { + "input": 2, + "output": 8 + }, + "type": "chat" + }, + { + "id": "openai/gpt-4o-audio", + "name": "OpenAI GPT-4o Audio", + "display_name": "GPT-4o Audio", + "modalities": { + "input": [ + "text", + "audio" + ], + "output": [ + "text", + "audio" + ] + }, + "limit": { + "output": 16384 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "cost": { + "input": 2, + "output": 8 + }, + "type": "chat" + }, + { + "id": "openai/gpt-4o-mini", + "name": "OpenAI GPT-4o mini", + "display_name": "GPT-4o mini", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "cost": { + "input": 0.12, + "output": 0.48 + }, + "type": "chat" + }, + { + "id": "openai/gpt-4o-mini-audio", + "name": "OpenAI GPT-4o mini Audio", + "display_name": "GPT-4o mini Audio", + "modalities": { + "input": [ + "text", + "audio" + ], + "output": [ + "text", + "audio" + ] + }, + "limit": { + "output": 16384 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "cost": { + "input": 0.12, + "output": 0.48 + }, + "type": "chat" + }, + { + "id": "openai/gpt-4o-realtime", + "name": "OpenAI GPT-4o Realtime", + "display_name": "GPT-4o Realtime", + "modalities": { + "input": [ + "text", + "audio" + ], + "output": [ + "text", + "audio" + ] + }, + "limit": { + "output": 4096 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "cost": { + "input": 4, + "output": 16 + }, + "type": "chat" + }, + { + "id": "openai/gpt-4o-mini-realtime", + "name": "OpenAI GPT-4o mini Realtime", + "display_name": "GPT-4o mini Realtime", + "modalities": { + "input": [ + "text", + "audio" + ], + "output": [ + "text", + "audio" + ] + }, + "limit": { + "output": 4096 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "cost": { + "input": 0.48, + "output": 1.92 + }, + "type": "chat" + }, + { + "id": "openai/gpt-image-1", + "name": "OpenAI GPT Image 1", + "display_name": "GPT Image 1", + "modalities": { + "input": [ + "text" + ], + "output": [ + "image" + ] + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "cost": { + "input": 4, + "output": 32 + }, + "type": "imageGeneration" + }, + { + "id": "openai/gpt-4o-mini-tts", + "name": "OpenAI GPT-4o mini TTS", + "display_name": "GPT-4o mini TTS", + "modalities": { + "input": [ + "text" + ], + "output": [ + "audio" + ] + }, + "temperature": false, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "cost": { + "input": 0.48, + "output": 0.96 + } + }, + { + "id": "openai/tts-1-hd", + "name": "OpenAI TTS-1 HD", + "display_name": "TTS-1 HD", + "modalities": { + "input": [ + "text" + ], + "output": [ + "audio" + ] + }, + "temperature": false, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "cost": { + "input": 24 + } + }, + { + "id": "openai/gpt-4o-transcribe", + "name": "OpenAI GPT-4o Transcribe", + "display_name": "GPT-4o Transcribe", + "modalities": { + "input": [ + "audio" + ], + "output": [ + "text" + ] + }, + "limit": { + "output": 2000 + }, + "temperature": false, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "cost": { + "input": 2, + "output": 8 + } + }, + { + "id": "openai/whisper", + "name": "OpenAI Whisper", + "display_name": "Whisper", + "modalities": { + "input": [ + "audio" + ], + "output": [ + "text" + ] + }, + "temperature": false, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "cost": { + "input": 0.0048 + } + }, + { + "id": "openai/gpt-4o-search-preview", + "name": "OpenAI GPT-4o Search Preview", + "display_name": "GPT-4o Search Preview", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "output": 16384 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "cost": { + "input": 2, + "output": 8 + }, + "type": "chat" + }, + { + "id": "openai/computer-use-preview", + "name": "OpenAI Computer Use Preview", + "display_name": "computer-use-preview", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "output": 1024 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "cost": { + "input": 2.4, + "output": 9.6 + }, + "type": "chat" + }, + { + "id": "google/gemini-2.5-pro", + "name": "Google Gemini 2.5 Pro", + "display_name": "Gemini 2.5 Pro", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "output": 65536 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "cost": { + "input": 1, + "output": 8 + }, + "type": "chat" + }, + { + "id": "google/gemini-2.5-flash", + "name": "Google Gemini 2.5 Flash", + "display_name": "Gemini 2.5 Flash", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "output": 65536 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "cost": { + "input": 0.12, + "output": 0.48 + }, + "type": "chat" + }, + { + "id": "google/gemini-2.0-flash", + "name": "Google Gemini 2.0 Flash", + "display_name": "Gemini 2.0 Flash", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "cost": { + "input": 0.08, + "output": 0.32 + }, + "type": "chat" + }, + { + "id": "google/imagen-3", + "name": "Google Imagen 3", + "display_name": "Imagen 3", + "modalities": { + "input": [ + "text" + ], + "output": [ + "image" + ] + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "cost": { + "input": 0.024 + }, + "type": "imageGeneration" + }, + { + "id": "google/veo-2", + "name": "Google Veo 2", + "display_name": "Veo 2", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "video" + ] + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "cost": { + "input": 0.28 + } + }, + { + "id": "anthropic/claude-sonnet-4", + "name": "Anthropic Claude Sonnet 4", + "display_name": "Claude Sonnet 4", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 200000, + "output": 200000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "cost": { + "input": 2.4, + "output": 12 + }, + "type": "chat" + }, + { + "id": "anthropic/claude-opus-4", + "name": "Anthropic Claude Opus 4", + "display_name": "Claude Opus 4", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 200000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "cost": { + "input": 12, + "output": 60 + }, + "type": "chat" + }, + { + "id": "anthropic/claude-3.7-sonnet", + "name": "Anthropic Claude 3.7 Sonnet", + "display_name": "Claude 3.7 Sonnet", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 200000, + "output": 200000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "cost": { + "input": 2.4, + "output": 12 + }, + "type": "chat" + }, + { + "id": "anthropic/claude-3.5-haiku", + "name": "Anthropic Claude 3.5 Haiku", + "display_name": "Claude 3.5 Haiku", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 200000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "cost": { + "input": 0.64, + "output": 3.2 + }, + "type": "chat" + }, + { + "id": "xai/grok-3", + "name": "xAI Grok-3", + "display_name": "Grok-3", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "cost": { + "input": 2.4, + "output": 12 + }, + "type": "chat" + }, + { + "id": "xai/grok-3-mini", + "name": "xAI Grok-3 Mini", + "display_name": "Grok-3 Mini", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "output": 4096 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "cost": { + "input": 0.24, + "output": 0.4 + }, + "type": "chat" + }, + { + "id": "deepseek/deepseek-r1", + "name": "DeepSeek Reasoner", + "display_name": "DeepSeek R1", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "cost": { + "input": 0.1104, + "output": 1.7632 + }, + "type": "chat" + }, + { + "id": "deepseek/deepseek-chat", + "name": "DeepSeek Chat", + "display_name": "DeepSeek Chat", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "cost": { + "input": 0.0552, + "output": 0.8816 + }, + "type": "chat" + } + ] + }, + "cherryin": { + "id": "cherryin", + "name": "cherryin", + "display_name": "cherryin", + "models": [ + { + "id": "anthropic/claude-opus-4.5", + "name": "Claude Opus 4.5", + "display_name": "Claude Opus 4.5", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 200000, + "output": 64000 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "open_weights": false, + "cost": { + "input": 5, + "output": 25, + "cache_read": 0.5 + }, + "type": "chat" + }, + { + "id": "anthropic/claude-3.7-sonnet", + "name": "Anthropic: Claude 3.7 Sonnet", + "display_name": "Anthropic: Claude 3.7 Sonnet", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 200000, + "output": 64000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-01", + "release_date": "2025-02-19", + "last_updated": "2025-02-19" + }, + { + "id": "anthropic/claude-haiku-4.5", + "name": "Anthropic: claude-haiku-4-5", + "display_name": "Anthropic: claude-haiku-4-5", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 204800, + "output": 131072 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false + }, + { + "id": "anthropic/claude-opus-4", + "name": "Anthropic: Claude Opus 4", + "display_name": "Anthropic: Claude Opus 4", + "modalities": { + "input": [ + "image", + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 200000, + "output": 32000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22" + }, + { + "id": "anthropic/claude-opus-4.1", + "name": "Anthropic: Claude Opus 4.1", + "display_name": "Anthropic: Claude Opus 4.1", + "modalities": { + "input": [ + "image", + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 200000, + "output": 32000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-08-05", + "last_updated": "2025-08-05" + }, + { + "id": "anthropic/claude-sonnet-4", + "name": "Anthropic: Claude Sonnet 4", + "display_name": "Anthropic: Claude Sonnet 4", + "modalities": { + "input": [ + "image", + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1000000, + "output": 64000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22" + }, + { + "id": "anthropic/claude-sonnet-4.5", + "name": "Anthropic: Claude Sonnet 4.5", + "display_name": "Anthropic: Claude Sonnet 4.5", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1000000, + "output": 64000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29" + }, + { + "id": "bytedance/seed-oss-36b-instruct", + "name": "ByteDance: Seed OSS 36B Instruct", + "display_name": "ByteDance: Seed OSS 36B Instruct", + "limit": { + "context": 4096, + "output": 4096 + }, + "tool_call": false, + "reasoning": { + "supported": false + } + }, + { + "id": "deepseek/deepseek-r1-0528", + "name": "DeepSeek: R1 0528", + "display_name": "DeepSeek: R1 0528", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 163840, + "output": 163840 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": false + }, + { + "id": "deepseek/deepseek-v3.1", + "name": "DeepSeek V3.1", + "display_name": "DeepSeek V3.1", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": false, + "knowledge": "2024-07", + "release_date": "2025-08-20", + "last_updated": "2025-08-26" + }, + { + "id": "deepseek/deepseek-v3.1-fast", + "name": "DeepSeek: DeepSeek V3.1 (free)", + "display_name": "DeepSeek: DeepSeek V3.1 (free)", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 163800 + }, + "temperature": false, + "tool_call": false, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": false + }, + { + "id": "deepseek/deepseek-v3.1-terminus", + "name": "DeepSeek: DeepSeek V3.1 Terminus", + "display_name": "DeepSeek: DeepSeek V3.1 Terminus", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 163840, + "output": 163840 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-07", + "release_date": "2025-09-22", + "last_updated": "2025-09-22" + }, + { + "id": "deepseek/deepseek-v3.2-exp", + "name": "DeepSeek: DeepSeek V3.2 Exp", + "display_name": "DeepSeek: DeepSeek V3.2 Exp", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 163840 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": false + }, + { + "id": "google/gemini-2.5-flash", + "name": "Google: Gemini 2.5 Flash", + "display_name": "Google: Gemini 2.5 Flash", + "modalities": { + "input": [ + "image", + "text", + "audio" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1048576, + "output": 65535 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-07-17", + "last_updated": "2025-07-17" + }, + { + "id": "google/gemini-2.5-flash-image", + "name": "Google: Gemini 2.5 Flash Image (Nano Banana)", + "display_name": "Google: Gemini 2.5 Flash Image (Nano Banana)", + "modalities": { + "input": [ + "image", + "text" + ], + "output": [ + "image", + "text" + ] + }, + "limit": { + "context": 32768, + "output": 8192 + }, + "temperature": false, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false + }, + { + "id": "google/gemini-2.5-flash-image-preview", + "name": "Google: Gemini 2.5 Flash Image Preview (Nano Banana)", + "display_name": "Google: Gemini 2.5 Flash Image Preview (Nano Banana)", + "modalities": { + "input": [ + "image", + "text" + ], + "output": [ + "image", + "text" + ] + }, + "limit": { + "context": 32768, + "output": 8192 + }, + "temperature": false, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false + }, + { + "id": "google/gemini-2.5-flash-lite", + "name": "Google: Gemini 2.5 Flash Lite", + "display_name": "Google: Gemini 2.5 Flash Lite", + "modalities": { + "input": [ + "image", + "text", + "audio" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1048576, + "output": 65535 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true + }, + { + "id": "google/gemini-2.5-pro", + "name": "Google: Gemini 2.5 Pro", + "display_name": "Google: Gemini 2.5 Pro", + "modalities": { + "input": [ + "image", + "text", + "audio" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1048576, + "output": 65536 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-06-05" + }, + { + "id": "google/gemini-3-pro-preview", + "name": "Google: Gemini 3 Pro Preview", + "display_name": "Google: Gemini 3 Pro Preview", + "modalities": { + "input": [ + "image", + "text", + "audio", + "video" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1048576, + "output": 65536 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-10", + "release_date": "2025-11-19", + "last_updated": "2025-11-19" + }, + { + "id": "inclusionai/ling-1t", + "name": "inclusionAI: Ling-1T", + "display_name": "inclusionAI: Ling-1T", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 131072 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false + }, + { + "id": "meituan/longcat-flash-chat", + "name": "Meituan: LongCat-Flash-Chat", + "display_name": "Meituan: LongCat-Flash-Chat", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false + }, + { + "id": "minimax/minimax-m2", + "name": "MiniMax: minimax-m2", + "display_name": "MiniMax: minimax-m2", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 204800, + "output": 192000 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false + }, + { + "id": "minimaxai/minimax-m1-80k", + "name": "MiniMax: MiniMax M1", + "display_name": "MiniMax: MiniMax M1", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1000000, + "output": 40000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": false + }, + { + "id": "moonshotai/kimi-k2-0905", + "name": "MoonshotAI: Kimi K2 0905", + "display_name": "MoonshotAI: Kimi K2 0905", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 262144 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2025-09-05", + "last_updated": "2025-09-05" + }, + { + "id": "moonshotai/kimi-k2-thinking", + "name": "MoonshotAI: kimi-k2-thinking", + "display_name": "MoonshotAI: kimi-k2-thinking", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 262144 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": false + }, + { + "id": "moonshotai/kimi-k2-thinking-turbo", + "name": "MoonshotAI: kimi-k2-thinking", + "display_name": "MoonshotAI: kimi-k2-thinking", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 262144 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": false + }, + { + "id": "openai/gpt-4.1", + "name": "OpenAI: GPT-4.1", + "display_name": "OpenAI: GPT-4.1", + "modalities": { + "input": [ + "image", + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1047576, + "output": 32768 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14" + }, + { + "id": "openai/gpt-4.1-mini", + "name": "OpenAI: GPT-4.1 Mini", + "display_name": "OpenAI: GPT-4.1 Mini", + "modalities": { + "input": [ + "image", + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1047576, + "output": 32768 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14" + }, + { + "id": "openai/gpt-4.1-nano", + "name": "OpenAI: GPT-4.1 Nano", + "display_name": "OpenAI: GPT-4.1 Nano", + "modalities": { + "input": [ + "image", + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1047576, + "output": 32768 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true + }, + { + "id": "openai/gpt-4o", + "name": "OpenAI: gpt-4o", + "display_name": "OpenAI: gpt-4o", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false + }, + { + "id": "openai/gpt-4o-mini", + "name": "OpenAI: gpt-4o-mini", + "display_name": "OpenAI: gpt-4o-mini", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false + }, + { + "id": "openai/gpt-5", + "name": "OpenAI: GPT-5", + "display_name": "OpenAI: GPT-5", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 400000, + "output": 128000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-10-01", + "release_date": "2025-08-07", + "last_updated": "2025-08-07" + }, + { + "id": "openai/gpt-5-chat", + "name": "OpenAI: GPT-5 Chat", + "display_name": "OpenAI: GPT-5 Chat", + "modalities": { + "input": [ + "image", + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": false, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07" + }, + { + "id": "openai/gpt-5-mini", + "name": "OpenAI: GPT-5 Mini", + "display_name": "OpenAI: GPT-5 Mini", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 400000, + "output": 128000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-10-01", + "release_date": "2025-08-07", + "last_updated": "2025-08-07" + }, + { + "id": "openai/gpt-5-nano", + "name": "OpenAI: GPT-5 Nano", + "display_name": "OpenAI: GPT-5 Nano", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 400000, + "output": 128000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-10-01", + "release_date": "2025-08-07", + "last_updated": "2025-08-07" + }, + { + "id": "openai/gpt-5.1", + "name": "OpenAI: gpt-5.1", + "display_name": "OpenAI: gpt-5.1", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 400000, + "output": 128000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false + }, + { + "id": "openai/gpt-5.2", + "name": "OpenAI: gpt-5.2", + "display_name": "OpenAI: gpt-5.2", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 400000, + "output": 128000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false + }, + { + "id": "openai/gpt-5.1-chat", + "name": "OpenAI: gpt-5.1", + "display_name": "OpenAI: gpt-5.1", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 400000, + "output": 128000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false + }, + { + "id": "openai/gpt-image-1", + "name": "OpenAI: gpt-image-1", + "display_name": "OpenAI: gpt-image-1", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false + }, + { + "id": "openai/gpt-oss-120b", + "name": "OpenAI: gpt-oss-120b", + "display_name": "OpenAI: gpt-oss-120b", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 131072 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05" + }, + { + "id": "openai/gpt-oss-20b", + "name": "OpenAI: gpt-oss-20b", + "display_name": "OpenAI: gpt-oss-20b", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 32768 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05" + }, + { + "id": "openai/o1", + "name": "OpenAI: o1", + "display_name": "OpenAI: o1", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 200000, + "output": 100000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true + }, + { + "id": "openai/o1-mini", + "name": "OpenAI: o1-mini", + "display_name": "OpenAI: o1-mini", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 65536 + }, + "temperature": false, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false + }, + { + "id": "openai/o3", + "name": "OpenAI: o3", + "display_name": "OpenAI: o3", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 200000, + "output": 100000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false + }, + { + "id": "openai/o4-mini", + "name": "OpenAI: o4 Mini", + "display_name": "OpenAI: o4 Mini", + "modalities": { + "input": [ + "image", + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 200000, + "output": 100000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-06", + "release_date": "2025-04-16", + "last_updated": "2025-04-16" + }, + { + "id": "qwen/qwen3-235b-a22b-instruct-2507", + "name": "Qwen: Qwen3 235B A22B Instruct 2507", + "display_name": "Qwen: Qwen3 235B A22B Instruct 2507", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 262144 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false + }, + { + "id": "qwen/qwen3-235b-a22b-thinking-2507", + "name": "Qwen: Qwen3 235B A22B Thinking 2507", + "display_name": "Qwen: Qwen3 235B A22B Thinking 2507", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 262144 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-25", + "last_updated": "2025-07-25" + }, + { + "id": "qwen/qwen3-30b-a3b-instruct-2507", + "name": "Qwen: Qwen3 30B A3B Instruct 2507", + "display_name": "Qwen: Qwen3 30B A3B Instruct 2507", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 262144 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-29", + "last_updated": "2025-07-29" + }, + { + "id": "qwen/qwen3-30b-a3b-thinking-2507", + "name": "Qwen: Qwen3 30B A3B Thinking 2507", + "display_name": "Qwen: Qwen3 30B A3B Thinking 2507", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 262144 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": false + }, + { + "id": "qwen/qwen3-8b", + "name": "Qwen: Qwen3 8B", + "display_name": "Qwen: Qwen3 8B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 20000 + }, + "temperature": false, + "tool_call": false, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": false + }, + { + "id": "qwen/qwen3-coder", + "name": "Qwen: Qwen3 Coder 480B A35B", + "display_name": "Qwen: Qwen3 Coder 480B A35B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 262144 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2025-07-23" + }, + { + "id": "qwen/qwen3-coder-30b-a3b-instruct", + "name": "Qwen: Qwen3 Coder 30B A3B Instruct", + "display_name": "Qwen: Qwen3 Coder 30B A3B Instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 262144 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false + }, + { + "id": "qwen/qwen3-coder-480b-a35b-instruct", + "name": "Qwen: Qwen3 Coder 480B A35B Instruct", + "display_name": "Qwen: Qwen3 Coder 480B A35B Instruct", + "limit": { + "context": 4096, + "output": 4096 + }, + "tool_call": false, + "reasoning": { + "supported": false + } + }, + { + "id": "qwen/qwen3-embedding-0.6b", + "name": "qwen/qwen3-embedding-0.6b", + "display_name": "qwen/qwen3-embedding-0.6b", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "embedding" + }, + { + "id": "qwen/qwen3-embedding-4b", + "name": "qwen/qwen3-embedding-4b", + "display_name": "qwen/qwen3-embedding-4b", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "embedding" + }, + { + "id": "qwen/qwen3-embedding-8b", + "name": "qwen/qwen3-embedding-8b", + "display_name": "qwen/qwen3-embedding-8b", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "embedding" + }, + { + "id": "qwen/qwen3-next-80b-a3b-instruct", + "name": "Qwen: Qwen3 Next 80B A3B Instruct", + "display_name": "Qwen: Qwen3 Next 80B A3B Instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 262144 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-09-11", + "last_updated": "2025-09-11" + }, + { + "id": "qwen/qwen3-next-80b-a3b-thinking", + "name": "Qwen: Qwen3 Next 80B A3B Thinking", + "display_name": "Qwen: Qwen3 Next 80B A3B Thinking", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": false + }, + { + "id": "qwen/qwen3-omni-30b-a3b-instruct", + "name": "Qwen: Qwen3 VL 30B A3B Instruct", + "display_name": "Qwen: Qwen3 VL 30B A3B Instruct", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 262144 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false + }, + { + "id": "qwen/qwen3-omni-30b-a3b-thinking", + "name": "Qwen: Qwen3 VL 30B A3B Thinking", + "display_name": "Qwen: Qwen3 VL 30B A3B Thinking", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 262144 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": false + }, + { + "id": "qwen/qwen3-reranker-0.6b", + "name": "qwen/qwen3-reranker-0.6b", + "display_name": "qwen/qwen3-reranker-0.6b", + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "qwen/qwen3-reranker-4b", + "name": "qwen/qwen3-reranker-4b", + "display_name": "qwen/qwen3-reranker-4b", + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "qwen/qwen3-reranker-8b", + "name": "qwen/qwen3-reranker-8b", + "display_name": "qwen/qwen3-reranker-8b", + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "qwen/qwen3-vl-235b-a22b-instruct", + "name": "Qwen: Qwen3 VL 235B A22B Instruct", + "display_name": "Qwen: Qwen3 VL 235B A22B Instruct", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": false + }, + { + "id": "qwen/qwen3-vl-235b-a22b-thinking", + "name": "Qwen: Qwen3 VL 235B A22B Thinking", + "display_name": "Qwen: Qwen3 VL 235B A22B Thinking", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 65536, + "output": 65536 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": false + }, + { + "id": "qwen/qwen3-vl-30b-a3b-instruct", + "name": "Qwen: Qwen3 VL 30B A3B Instruct", + "display_name": "Qwen: Qwen3 VL 30B A3B Instruct", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 262144 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false + }, + { + "id": "qwen/qwen3-vl-30b-a3b-thinking", + "name": "Qwen: Qwen3 VL 30B A3B Thinking", + "display_name": "Qwen: Qwen3 VL 30B A3B Thinking", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, "limit": { - "context": 65536, - "output": 65536 + "context": 262144, + "output": 262144 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "attachment": false + }, + { + "id": "tencent/hunyuan-mt-7b", + "name": "Tencent: Hunyuan A13B Instruct", + "display_name": "Tencent: Hunyuan A13B Instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 32768 + }, + "temperature": false, + "tool_call": false, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": false + }, + { + "id": "x-ai/grok-2-image", + "name": "grok-2", + "display_name": "grok-2", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text", + "image" + ] + }, + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, "type": "chat" }, { - "id": "qwen/qwen3-vl-235b-a22b-instruct", - "name": "Qwen3 VL 235B A22B Instruct", - "display_name": "Qwen3 VL 235B A22B Instruct", + "id": "x-ai/grok-3", + "name": "xAI: Grok 3", + "display_name": "xAI: Grok 3", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, "limit": { "context": 131072, - "output": 32768 + "output": 8192 }, + "temperature": false, "tool_call": true, "reasoning": { "supported": false }, - "type": "chat" + "attachment": false, + "open_weights": false, + "knowledge": "2024-11", + "release_date": "2025-02-17", + "last_updated": "2025-02-17" }, { - "id": "qwen/qwen3-vl-235b-a22b-thinking", - "name": "Qwen3 VL 235B A22B Thinking", - "display_name": "Qwen3 VL 235B A22B Thinking", + "id": "x-ai/grok-3-mini", + "name": "xAI: Grok 3 Mini", + "display_name": "xAI: Grok 3 Mini", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, "limit": { "context": 131072, - "output": 32768 + "output": 8192 }, - "tool_call": false, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": false, + "knowledge": "2024-11", + "release_date": "2025-02-17", + "last_updated": "2025-02-17" + }, + { + "id": "x-ai/grok-4", + "name": "xAI: Grok 4", + "display_name": "xAI: Grok 4", + "modalities": { + "input": [ + "image", + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 256000, + "output": 64000 + }, + "temperature": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, + "attachment": false, + "open_weights": false, + "knowledge": "2025-07", + "release_date": "2025-07-09", + "last_updated": "2025-07-09" + }, + { + "id": "x-ai/grok-4-fast-non-reasoning", + "name": "x-ai/grok-4-fast-non-reasoning", + "display_name": "x-ai/grok-4-fast-non-reasoning", + "limit": { + "context": 2000000, + "output": 2000000 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, "type": "chat" }, { - "id": "qwen/qwen3-235b-a22b-fp8", - "name": "Qwen3-235B-A22B", - "display_name": "Qwen3-235B-A22B", + "id": "x-ai/grok-4-fast-reasoning", + "name": "x-ai/grok-4-fast-reasoning", + "display_name": "x-ai/grok-4-fast-reasoning", "limit": { - "context": 40960, - "output": 20000 + "context": 2000000, + "output": 2000000 }, "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "x-ai/grok-code-fast-1", + "name": "xAI: Grok Code Fast 1", + "display_name": "xAI: Grok Code Fast 1", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 256000, + "output": 10000 + }, + "temperature": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "type": "chat" + "attachment": false, + "open_weights": false, + "knowledge": "2025-08", + "release_date": "2025-08-26", + "last_updated": "2025-08-26" }, { - "id": "qwen/qwen3-30b-a3b-fp8", - "name": "Qwen3-30B-A3B", - "display_name": "Qwen3-30B-A3B", + "id": "z-ai/glm-4.5", + "name": "Z.AI: GLM 4.5", + "display_name": "Z.AI: GLM 4.5", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, "limit": { - "context": 128000, - "output": 20000 + "context": 131072, + "output": 131072 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28" + }, + { + "id": "z-ai/glm-4.5-flash", + "name": "z-ai/glm-4.5-flash", + "display_name": "z-ai/glm-4.5-flash", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, "type": "chat" }, { - "id": "xiaomimimo/mimo-v2-flash", - "name": "XiaomiMiMo/MiMo-V2-Flash", - "display_name": "XiaomiMiMo/MiMo-V2-Flash", + "id": "z-ai/glm-4.5v", + "name": "Z.AI: GLM 4.5V", + "display_name": "Z.AI: GLM 4.5V", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, "limit": { - "context": 262144, - "output": 32000 + "context": 65536, + "output": 16384 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "type": "chat" + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-08-11", + "last_updated": "2025-08-11" }, { - "id": "zai-org/glm-4.5-air", - "name": "zai-org/glm-4.5-air", - "display_name": "zai-org/glm-4.5-air", + "id": "z-ai/glm-4.6", + "name": "Z.AI: GLM 4.6", + "display_name": "Z.AI: GLM 4.6", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, "limit": { - "context": 131072, - "output": 98304 + "context": 202752, + "output": 202752 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-09", + "release_date": "2025-09-30", + "last_updated": "2025-09-30" + }, + { + "id": "z-ai/glm-4.7", + "name": "Z.AI: GLM 4.7", + "display_name": "Z.AI: GLM 4.7", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 200000, + "output": 200000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "attachment": false, + "open_weights": true, + "cost": { + "input": 0.273974, + "output": 1.095896, + "cache_read": 0.054795 + }, "type": "chat" - } - ] - }, - "tokenflux": { - "id": "tokenflux", - "name": "Tokenflux", - "display_name": "Tokenflux", - "models": [ + }, { - "id": "anthropic/claude-3-haiku", - "name": "anthropic/claude-3-haiku", - "display_name": "anthropic/claude-3-haiku", + "id": "xiaomi/mimo-v2-flash", + "name": "Xiaomi: Mimo V2 Flash", + "display_name": "Xiaomi: Mimo V2 Flash", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, "limit": { - "context": 4096, - "output": 4096 + "context": 8192, + "output": 8192 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, + "attachment": false, + "open_weights": false, + "cost": { + "input": 0.1918, + "output": 0.5754, + "cache_read": 0.03836 + }, "type": "chat" }, { - "id": "anthropic/claude-3.5-haiku", - "name": "anthropic/claude-3.5-haiku", - "display_name": "anthropic/claude-3.5-haiku", + "id": "xiaomimimo/mimo-v2-flash", + "name": "Xiaomi: Mimo V2 Flash", + "display_name": "Xiaomi: Mimo V2 Flash", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, "limit": { - "context": 4096, - "output": 4096 + "context": 8192, + "output": 8192 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, + "attachment": false, + "open_weights": false, + "cost": { + "input": 0.1918, + "output": 0.5754, + "cache_read": 0.03836 + }, "type": "chat" }, { - "id": "anthropic/claude-3.5-haiku-20241022", - "name": "anthropic/claude-3.5-haiku-20241022", - "display_name": "anthropic/claude-3.5-haiku-20241022", + "id": "minimax/minimax-m2.1", + "name": "MiniMax: minimax-m2.1", + "display_name": "MiniMax: minimax-m2.1", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, "limit": { - "context": 4096, - "output": 4096 + "context": 204800, + "output": 204800 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, + "attachment": false, + "open_weights": false, + "cost": { + "input": 0.288, + "output": 1.152 + }, "type": "chat" }, { - "id": "anthropic/claude-3.5-sonnet", - "name": "anthropic/claude-3.5-sonnet", - "display_name": "anthropic/claude-3.5-sonnet", + "id": "minimax/minimax-m2.1-lightning", + "name": "MiniMax: minimax-m2.1-lightning", + "display_name": "MiniMax: minimax-m2.1-lightning", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, "limit": { - "context": 4096, - "output": 4096 + "context": 204800, + "output": 204800 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, + "attachment": false, + "open_weights": false, + "cost": { + "input": 0.144, + "output": 0.576 + }, + "type": "chat" + } + ] + }, + "doubao": { + "id": "doubao", + "name": "Doubao", + "display_name": "Doubao", + "models": [ + { + "id": "deepseek-v3-1-250821", + "name": "DeepSeek V3.1", + "display_name": "DeepSeek V3.1", + "limit": { + "context": 128000, + "output": 32000 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, "type": "chat" }, { - "id": "anthropic/claude-3.7-sonnet", - "name": "anthropic/claude-3.7-sonnet", - "display_name": "anthropic/claude-3.7-sonnet", + "id": "deepseek-r1-250120", + "name": "DeepSeek R1", + "display_name": "DeepSeek R1", "limit": { - "context": 4096, + "context": 64000, "output": 4096 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "type": "chat" }, { - "id": "anthropic/claude-haiku-4.5", - "name": "anthropic/claude-haiku-4.5", - "display_name": "anthropic/claude-haiku-4.5", + "id": "deepseek-r1-distill-qwen-32b-250120", + "name": "DeepSeek R1 Distill Qwen 32B", + "display_name": "DeepSeek R1 Distill Qwen 32B", "limit": { - "context": 4096, + "context": 32000, "output": 4096 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "type": "chat" }, { - "id": "anthropic/claude-opus-4", - "name": "anthropic/claude-opus-4", - "display_name": "anthropic/claude-opus-4", + "id": "deepseek-r1-distill-qwen-7b-250120", + "name": "DeepSeek R1 Distill Qwen 7B", + "display_name": "DeepSeek R1 Distill Qwen 7B", "limit": { - "context": 4096, + "context": 32000, "output": 4096 }, "tool_call": false, + "reasoning": { + "supported": true, + "default": true + }, + "type": "chat" + }, + { + "id": "deepseek-v3-250324", + "name": "DeepSeek V3", + "display_name": "DeepSeek V3", + "limit": { + "context": 64000, + "output": 4096 + }, + "tool_call": true, "reasoning": { "supported": false }, "type": "chat" }, { - "id": "anthropic/claude-opus-4.1", - "name": "anthropic/claude-opus-4.1", - "display_name": "anthropic/claude-opus-4.1", + "id": "doubao-seed-1-6-vision-250815", + "name": "Doubao Seed 1.6 Vision", + "display_name": "Doubao Seed 1.6 Vision", + "limit": { + "context": 256000, + "output": 32000 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "type": "chat" + }, + { + "id": "doubao-seed-1-6-250615", + "name": "Doubao Seed 1.6", + "display_name": "Doubao Seed 1.6", + "limit": { + "context": 256000, + "output": 32000 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "type": "chat" + }, + { + "id": "doubao-seed-1-6-flash-250715", + "name": "Doubao Seed 1.6 Flash", + "display_name": "Doubao Seed 1.6 Flash", "limit": { - "context": 4096, - "output": 4096 + "context": 256000, + "output": 32000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "type": "chat" }, { - "id": "anthropic/claude-opus-4.5", - "name": "anthropic/claude-opus-4.5", - "display_name": "anthropic/claude-opus-4.5", + "id": "doubao-seed-1-6-flash-250615", + "name": "Doubao Seed 1.6 Flash (250615)", + "display_name": "Doubao Seed 1.6 Flash (250615)", "limit": { - "context": 4096, - "output": 4096 + "context": 256000, + "output": 32000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "type": "chat" }, { - "id": "anthropic/claude-sonnet-4", - "name": "anthropic/claude-sonnet-4", - "display_name": "anthropic/claude-sonnet-4", + "id": "doubao-seed-1-6-thinking-250715", + "name": "Doubao Seed 1.6 Thinking", + "display_name": "Doubao Seed 1.6 Thinking", "limit": { - "context": 4096, - "output": 4096 + "context": 256000, + "output": 32000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "type": "chat" }, { - "id": "anthropic/claude-sonnet-4.5", - "name": "anthropic/claude-sonnet-4.5", - "display_name": "anthropic/claude-sonnet-4.5", + "id": "doubao-seed-1-6-thinking-250615", + "name": "Doubao Seed 1.6 Thinking (250615)", + "display_name": "Doubao Seed 1.6 Thinking (250615)", "limit": { - "context": 4096, - "output": 4096 + "context": 256000, + "output": 32000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "type": "chat" - }, + } + ] + }, + "ppinfra": { + "id": "ppinfra", + "name": "PPInfra", + "display_name": "PPInfra", + "models": [ { - "id": "deepseek/deepseek-chat", - "name": "deepseek/deepseek-chat", - "display_name": "deepseek/deepseek-chat", + "id": "zai-org/autoglm-phone-9b-multilingual", + "name": "AutoGLM-Phone-9B-Multilingual", + "display_name": "AutoGLM-Phone-9B-Multilingual", "limit": { - "context": 4096, - "output": 4096 + "context": 65536, + "output": 32000 }, "tool_call": false, "reasoning": { @@ -69929,12 +81526,12 @@ "type": "chat" }, { - "id": "deepseek/deepseek-chat-v3-0324", - "name": "deepseek/deepseek-chat-v3-0324", - "display_name": "deepseek/deepseek-chat-v3-0324", + "id": "deepseek/deepseek-prover-v2-671b", + "name": "Deepseek Prover V2 671B", + "display_name": "Deepseek Prover V2 671B", "limit": { - "context": 4096, - "output": 4096 + "context": 160000, + "output": 160000 }, "tool_call": false, "reasoning": { @@ -69943,152 +81540,159 @@ "type": "chat" }, { - "id": "deepseek/deepseek-chat-v3.1", - "name": "deepseek/deepseek-chat-v3.1", - "display_name": "deepseek/deepseek-chat-v3.1", + "id": "deepseek/deepseek-r1/community", + "name": "DeepSeek R1 (Community)", + "display_name": "DeepSeek R1 (Community)", "limit": { - "context": 4096, - "output": 4096 + "context": 64000, + "output": 4000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "type": "chat" }, { - "id": "deepseek/deepseek-prover-v2", - "name": "deepseek/deepseek-prover-v2", - "display_name": "deepseek/deepseek-prover-v2", + "id": "deepseek/deepseek-r1-turbo", + "name": "DeepSeek R1 (Turbo)", + "display_name": "DeepSeek R1 (Turbo)", "limit": { - "context": 4096, - "output": 4096 + "context": 64000, + "output": 16000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "type": "chat" }, { - "id": "deepseek/deepseek-r1", - "name": "deepseek/deepseek-r1", - "display_name": "deepseek/deepseek-r1", + "id": "deepseek/deepseek-r1-distill-llama-70b", + "name": "DeepSeek R1 Distill Llama 70B", + "display_name": "DeepSeek R1 Distill Llama 70B", "limit": { - "context": 4096, - "output": 4096 + "context": 32000, + "output": 8000 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "type": "chat" }, { - "id": "deepseek/deepseek-r1-0528", - "name": "deepseek/deepseek-r1-0528", - "display_name": "deepseek/deepseek-r1-0528", + "id": "deepseek/deepseek-v3/community", + "name": "DeepSeek V3 (Community)", + "display_name": "DeepSeek V3 (Community)", "limit": { - "context": 4096, - "output": 4096 + "context": 64000, + "output": 4000 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "type": "chat" }, { - "id": "deepseek/deepseek-r1-0528-qwen3-8b", - "name": "deepseek/deepseek-r1-0528-qwen3-8b", - "display_name": "deepseek/deepseek-r1-0528-qwen3-8b", + "id": "deepseek/deepseek-v3-turbo", + "name": "DeepSeek V3 (Turbo)", + "display_name": "DeepSeek V3 (Turbo)", "limit": { - "context": 4096, - "output": 4096 + "context": 64000, + "output": 16000 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "type": "chat" }, { - "id": "deepseek/deepseek-v3.1-terminus", - "name": "deepseek/deepseek-v3.1-terminus", - "display_name": "deepseek/deepseek-v3.1-terminus", + "id": "deepseek/deepseek-v3-0324", + "name": "DeepSeek V3 0324", + "display_name": "DeepSeek V3 0324", "limit": { - "context": 4096, - "output": 4096 + "context": 163840, + "output": 163840 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "type": "chat" }, { - "id": "deepseek/deepseek-v3.2", - "name": "deepseek/deepseek-v3.2", - "display_name": "deepseek/deepseek-v3.2", + "id": "deepseek/deepseek-v3.1", + "name": "Deepseek V3.1", + "display_name": "Deepseek V3.1", "limit": { - "context": 4096, - "output": 4096 + "context": 131072, + "output": 32768 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "type": "chat" }, { - "id": "deepseek/deepseek-v3.2-exp", - "name": "deepseek/deepseek-v3.2-exp", - "display_name": "deepseek/deepseek-v3.2-exp", + "id": "deepseek/deepseek-v3.1-terminus", + "name": "Deepseek V3.1 Terminus", + "display_name": "Deepseek V3.1 Terminus", "limit": { - "context": 4096, - "output": 4096 + "context": 131072, + "output": 65536 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "type": "chat" }, { - "id": "deepseek/deepseek-v3.2-speciale", - "name": "deepseek/deepseek-v3.2-speciale", - "display_name": "deepseek/deepseek-v3.2-speciale", + "id": "deepseek/deepseek-v3.2", + "name": "Deepseek V3.2", + "display_name": "Deepseek V3.2", "limit": { - "context": 4096, - "output": 4096 + "context": 163840, + "output": 65536 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "type": "chat" }, { - "id": "google/gemini-2.0-flash-001", - "name": "google/gemini-2.0-flash-001", - "display_name": "google/gemini-2.0-flash-001", + "id": "deepseek/deepseek-v3.2-exp", + "name": "Deepseek V3.2 Exp", + "display_name": "Deepseek V3.2 Exp", "limit": { - "context": 4096, - "output": 4096 + "context": 163840, + "output": 65536 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "type": "chat" }, { - "id": "google/gemini-2.0-flash-lite-001", - "name": "google/gemini-2.0-flash-lite-001", - "display_name": "google/gemini-2.0-flash-lite-001", + "id": "deepseek/deepseek-ocr-2", + "name": "DeepSeek-OCR 2", + "display_name": "DeepSeek-OCR 2", "limit": { - "context": 4096, - "output": 4096 + "context": 8192, + "output": 8192 }, "tool_call": false, "reasoning": { @@ -70097,404 +81701,420 @@ "type": "chat" }, { - "id": "google/gemini-2.5-flash", - "name": "google/gemini-2.5-flash", - "display_name": "google/gemini-2.5-flash", + "id": "deepseek/deepseek-r1-0528", + "name": "deepseek/deepseek-r1-0528", + "display_name": "deepseek/deepseek-r1-0528", "limit": { - "context": 4096, - "output": 4096 + "context": 163840, + "output": 32768 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "type": "chat" }, { - "id": "google/gemini-2.5-flash-image", - "name": "google/gemini-2.5-flash-image", - "display_name": "google/gemini-2.5-flash-image", + "id": "baidu/ernie-4.5-21b-a3b-thinking", + "name": "Ernie 4.5 21B A3B Thinking", + "display_name": "Ernie 4.5 21B A3B Thinking", "limit": { - "context": 4096, - "output": 4096 + "context": 131072, + "output": 65536 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "type": "chat" }, { - "id": "google/gemini-2.5-flash-image-preview", - "name": "google/gemini-2.5-flash-image-preview", - "display_name": "google/gemini-2.5-flash-image-preview", + "id": "baidu/ernie-4.5-0.3b", + "name": "ERNIE-4.5-0.3B", + "display_name": "ERNIE-4.5-0.3B", "limit": { - "context": 4096, - "output": 4096 + "context": 120000, + "output": 8000 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "type": "chat" }, { - "id": "google/gemini-2.5-flash-lite", - "name": "google/gemini-2.5-flash-lite", - "display_name": "google/gemini-2.5-flash-lite", + "id": "baidu/ernie-4.5-21B-a3b", + "name": "ERNIE-4.5-21B-A3B", + "display_name": "ERNIE-4.5-21B-A3B", "limit": { - "context": 4096, - "output": 4096 + "context": 120000, + "output": 8000 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "type": "chat" }, { - "id": "google/gemini-2.5-flash-lite-preview-09-2025", - "name": "google/gemini-2.5-flash-lite-preview-09-2025", - "display_name": "google/gemini-2.5-flash-lite-preview-09-2025", + "id": "baidu/ernie-4.5-300b-a47b-paddle", + "name": "ERNIE-4.5-300B-A47B", + "display_name": "ERNIE-4.5-300B-A47B", "limit": { - "context": 4096, - "output": 4096 + "context": 123000, + "output": 12000 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "type": "chat" }, { - "id": "google/gemini-2.5-flash-preview-09-2025", - "name": "google/gemini-2.5-flash-preview-09-2025", - "display_name": "google/gemini-2.5-flash-preview-09-2025", + "id": "baidu/ernie-4.5-vl-28b-a3b", + "name": "ERNIE-4.5-VL-28B-A3B", + "display_name": "ERNIE-4.5-VL-28B-A3B", "limit": { - "context": 4096, - "output": 4096 + "context": 30000, + "output": 8000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "type": "chat" }, { - "id": "google/gemini-2.5-pro", - "name": "google/gemini-2.5-pro", - "display_name": "google/gemini-2.5-pro", + "id": "baidu/ernie-4.5-vl-424b-a47b", + "name": "ERNIE-4.5-VL-424B-A47B", + "display_name": "ERNIE-4.5-VL-424B-A47B", "limit": { - "context": 4096, - "output": 4096 + "context": 123000, + "output": 16000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "type": "chat" }, { - "id": "google/gemini-2.5-pro-preview", - "name": "google/gemini-2.5-pro-preview", - "display_name": "google/gemini-2.5-pro-preview", + "id": "zai-org/glm-4.5v", + "name": "GLM 4.5V", + "display_name": "GLM 4.5V", "limit": { - "context": 4096, - "output": 4096 + "context": 65536, + "output": 16384 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "type": "chat" }, { - "id": "google/gemini-2.5-pro-preview-05-06", - "name": "google/gemini-2.5-pro-preview-05-06", - "display_name": "google/gemini-2.5-pro-preview-05-06", + "id": "zai-org/glm-4.6", + "name": "GLM 4.6", + "display_name": "GLM 4.6", "limit": { - "context": 4096, - "output": 4096 + "context": 204800, + "output": 131072 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "type": "chat" }, { - "id": "google/gemini-3-flash-preview", - "name": "google/gemini-3-flash-preview", - "display_name": "google/gemini-3-flash-preview", + "id": "zai-org/glm-4.6v", + "name": "GLM 4.6v", + "display_name": "GLM 4.6v", "limit": { - "context": 4096, - "output": 4096 + "context": 131072, + "output": 32768 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "type": "chat" }, { - "id": "google/gemini-3-pro-image-preview", - "name": "google/gemini-3-pro-image-preview", - "display_name": "google/gemini-3-pro-image-preview", + "id": "zai-org/glm-4.5", + "name": "GLM-4.5", + "display_name": "GLM-4.5", "limit": { - "context": 4096, - "output": 4096 + "context": 131072, + "output": 98304 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "type": "chat" }, { - "id": "google/gemini-3-pro-preview", - "name": "google/gemini-3-pro-preview", - "display_name": "google/gemini-3-pro-preview", + "id": "zai-org/glm-4.7", + "name": "GLM-4.7", + "display_name": "GLM-4.7", "limit": { - "context": 4096, - "output": 4096 + "context": 204800, + "output": 131072 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "type": "chat" }, { - "id": "google/gemma-2-27b-it", - "name": "google/gemma-2-27b-it", - "display_name": "google/gemma-2-27b-it", + "id": "zai-org/glm-4.7-flash", + "name": "GLM-4.7-Flash", + "display_name": "GLM-4.7-Flash", "limit": { - "context": 4096, - "output": 4096 + "context": 200000, + "output": 128000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "type": "chat" }, { - "id": "google/gemma-2-9b-it", - "name": "google/gemma-2-9b-it", - "display_name": "google/gemma-2-9b-it", + "id": "kat-coder", + "name": "KAT Coder Pro V1", + "display_name": "KAT Coder Pro V1", "limit": { - "context": 4096, - "output": 4096 + "context": 256000, + "output": 128000 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "type": "chat" }, { - "id": "google/gemma-3-12b-it", - "name": "google/gemma-3-12b-it", - "display_name": "google/gemma-3-12b-it", + "id": "moonshotai/kimi-k2-0905", + "name": "Kimi K2 0905", + "display_name": "Kimi K2 0905", "limit": { - "context": 4096, - "output": 4096 + "context": 262144, + "output": 262144 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "type": "chat" }, { - "id": "google/gemma-3-27b-it", - "name": "google/gemma-3-27b-it", - "display_name": "google/gemma-3-27b-it", + "id": "moonshotai/kimi-k2-instruct", + "name": "Kimi K2 Instruct", + "display_name": "Kimi K2 Instruct", "limit": { - "context": 4096, - "output": 4096 + "context": 131072, + "output": 128000 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "type": "chat" }, { - "id": "google/gemma-3-4b-it", - "name": "google/gemma-3-4b-it", - "display_name": "google/gemma-3-4b-it", + "id": "moonshotai/kimi-k2-thinking", + "name": "Kimi K2 Thinking", + "display_name": "Kimi K2 Thinking", "limit": { - "context": 4096, - "output": 4096 + "context": 262144, + "output": 262144 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "type": "chat" }, { - "id": "google/gemma-3n-e4b-it", - "name": "google/gemma-3n-e4b-it", - "display_name": "google/gemma-3n-e4b-it", + "id": "moonshotai/kimi-k2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "limit": { - "context": 4096, - "output": 4096 + "context": 262144, + "output": 262144 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "type": "chat" }, { - "id": "minimax/minimax-01", - "name": "minimax/minimax-01", - "display_name": "minimax/minimax-01", + "id": "minimax/minimax-m2.1", + "name": "MiniMax M2.1", + "display_name": "MiniMax M2.1", "limit": { - "context": 4096, - "output": 4096 + "context": 204800, + "output": 131072 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "type": "chat" }, { - "id": "minimax/minimax-m1", - "name": "minimax/minimax-m1", - "display_name": "minimax/minimax-m1", + "id": "minimax/minimax-m2", + "name": "MiniMax-M2", + "display_name": "MiniMax-M2", "limit": { - "context": 4096, - "output": 4096 + "context": 204800, + "output": 131072 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "type": "chat" }, { - "id": "minimax/minimax-m2", - "name": "minimax/minimax-m2", - "display_name": "minimax/minimax-m2", + "id": "minimaxai/minimax-m1-80k", + "name": "MiniMaxAI/MiniMax-M1-80k", + "display_name": "MiniMaxAI/MiniMax-M1-80k", "limit": { - "context": 4096, - "output": 4096 + "context": 128000, + "output": 40000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "type": "chat" }, { - "id": "minimax/minimax-m2.1", - "name": "minimax/minimax-m2.1", - "display_name": "minimax/minimax-m2.1", + "id": "qwen/qwen2.5-7b-instruct", + "name": "Qwen 2.5 7B Instruct", + "display_name": "Qwen 2.5 7B Instruct", "limit": { - "context": 4096, - "output": 4096 + "context": 32000, + "output": 32000 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "type": "chat" }, { - "id": "moonshotai/kimi-dev-72b", - "name": "moonshotai/kimi-dev-72b", - "display_name": "moonshotai/kimi-dev-72b", + "id": "qwen/qwen3-omni-30b-a3b-instruct", + "name": "qwen/qwen3-omni-30b-a3b-instruct", + "display_name": "qwen/qwen3-omni-30b-a3b-instruct", "limit": { - "context": 4096, - "output": 4096 + "context": 65536, + "output": 16384 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "type": "chat" }, { - "id": "moonshotai/kimi-k2", - "name": "moonshotai/kimi-k2", - "display_name": "moonshotai/kimi-k2", + "id": "qwen/qwen3-omni-30b-a3b-thinking", + "name": "qwen/qwen3-omni-30b-a3b-thinking", + "display_name": "qwen/qwen3-omni-30b-a3b-thinking", "limit": { - "context": 4096, - "output": 4096 + "context": 65536, + "output": 16384 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "type": "chat" }, { - "id": "moonshotai/kimi-k2-0905", - "name": "moonshotai/kimi-k2-0905", - "display_name": "moonshotai/kimi-k2-0905", + "id": "qwen/qwen3-vl-30b-a3b-instruct", + "name": "qwen/qwen3-vl-30b-a3b-instruct", + "display_name": "qwen/qwen3-vl-30b-a3b-instruct", "limit": { - "context": 4096, - "output": 4096 + "context": 131072, + "output": 32768 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "type": "chat" }, { - "id": "moonshotai/kimi-k2-thinking", - "name": "moonshotai/kimi-k2-thinking", - "display_name": "moonshotai/kimi-k2-thinking", + "id": "qwen/qwen3-vl-30b-a3b-thinking", + "name": "qwen/qwen3-vl-30b-a3b-thinking", + "display_name": "qwen/qwen3-vl-30b-a3b-thinking", "limit": { - "context": 4096, - "output": 4096 + "context": 131072, + "output": 32768 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "type": "chat" }, { - "id": "morph/morph-v3-fast", - "name": "morph/morph-v3-fast", - "display_name": "morph/morph-v3-fast", + "id": "qwen/qwen3-vl-8b-instruct", + "name": "qwen/qwen3-vl-8b-instruct", + "display_name": "qwen/qwen3-vl-8b-instruct", "limit": { - "context": 4096, - "output": 4096 + "context": 131072, + "output": 32768 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "type": "chat" }, { - "id": "morph/morph-v3-large", - "name": "morph/morph-v3-large", - "display_name": "morph/morph-v3-large", + "id": "qwen/qwen-2.5-72b-instruct", + "name": "Qwen2.5 72B Instruct", + "display_name": "Qwen2.5 72B Instruct", "limit": { - "context": 4096, - "output": 4096 + "context": 32000, + "output": 16000 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "type": "chat" }, { - "id": "openai/chatgpt-4o-latest", - "name": "openai/chatgpt-4o-latest", - "display_name": "openai/chatgpt-4o-latest", + "id": "qwen/qwen2.5-vl-72b-instruct", + "name": "Qwen2.5 VL 72B Instruct", + "display_name": "Qwen2.5 VL 72B Instruct", "limit": { - "context": 4096, - "output": 4096 + "context": 32000, + "output": 32000 }, "tool_call": false, "reasoning": { @@ -70503,219 +82123,235 @@ "type": "chat" }, { - "id": "openai/codex-mini", - "name": "openai/codex-mini", - "display_name": "openai/codex-mini", + "id": "qwen/qwen3-235b-a22b-instruct-2507", + "name": "Qwen3 235B A22B Instruct 2507", + "display_name": "Qwen3 235B A22B Instruct 2507", "limit": { - "context": 4096, - "output": 4096 + "context": 262144, + "output": 260000 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "type": "chat" }, { - "id": "openai/gpt-3.5-turbo", - "name": "openai/gpt-3.5-turbo", - "display_name": "openai/gpt-3.5-turbo", + "id": "qwen/qwen3-235b-a22b-thinking-2507", + "name": "Qwen3 235B A22b Thinking 2507", + "display_name": "Qwen3 235B A22b Thinking 2507", "limit": { - "context": 4096, - "output": 4096 + "context": 131072, + "output": 114688 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "type": "chat" }, { - "id": "openai/gpt-3.5-turbo-0613", - "name": "openai/gpt-3.5-turbo-0613", - "display_name": "openai/gpt-3.5-turbo-0613", + "id": "qwen/qwen3-32b-fp8", + "name": "Qwen3 32B", + "display_name": "Qwen3 32B", "limit": { - "context": 4096, - "output": 4096 + "context": 128000, + "output": 20000 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "type": "chat" }, { - "id": "openai/gpt-3.5-turbo-16k", - "name": "openai/gpt-3.5-turbo-16k", - "display_name": "openai/gpt-3.5-turbo-16k", + "id": "qwen/qwen3-4b-fp8", + "name": "Qwen3 4B", + "display_name": "Qwen3 4B", "limit": { - "context": 4096, - "output": 4096 + "context": 128000, + "output": 20000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "type": "chat" }, { - "id": "openai/gpt-3.5-turbo-instruct", - "name": "openai/gpt-3.5-turbo-instruct", - "display_name": "openai/gpt-3.5-turbo-instruct", + "id": "qwen/qwen3-coder-30b-a3b-instruct", + "name": "Qwen3 Coder 30b A3B Instruct", + "display_name": "Qwen3 Coder 30b A3B Instruct", "limit": { - "context": 4096, - "output": 4096 + "context": 262144, + "output": 65536 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "type": "chat" }, { - "id": "openai/gpt-4", - "name": "openai/gpt-4", - "display_name": "openai/gpt-4", + "id": "qwen/qwen3-coder-480b-a35b-instruct", + "name": "Qwen3 Coder 480B A35B Instruct", + "display_name": "Qwen3 Coder 480B A35B Instruct", "limit": { - "context": 4096, - "output": 4096 + "context": 262144, + "output": 65536 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "type": "chat" }, { - "id": "openai/gpt-4-0314", - "name": "openai/gpt-4-0314", - "display_name": "openai/gpt-4-0314", + "id": "qwen/qwen3-coder-next", + "name": "Qwen3 Coder Next", + "display_name": "Qwen3 Coder Next", "limit": { - "context": 4096, - "output": 4096 + "context": 262144, + "output": 65536 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "type": "chat" }, { - "id": "openai/gpt-4-1106-preview", - "name": "openai/gpt-4-1106-preview", - "display_name": "openai/gpt-4-1106-preview", + "id": "qwen/qwen3-next-80b-a3b-instruct", + "name": "Qwen3 Next 80B A3B Instruct", + "display_name": "Qwen3 Next 80B A3B Instruct", "limit": { - "context": 4096, - "output": 4096 + "context": 65536, + "output": 65536 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "type": "chat" }, { - "id": "openai/gpt-4-turbo", - "name": "openai/gpt-4-turbo", - "display_name": "openai/gpt-4-turbo", + "id": "qwen/qwen3-next-80b-a3b-thinking", + "name": "Qwen3 Next 80B A3B Thinking", + "display_name": "Qwen3 Next 80B A3B Thinking", "limit": { - "context": 4096, - "output": 4096 + "context": 65536, + "output": 65536 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "type": "chat" }, { - "id": "openai/gpt-4-turbo-preview", - "name": "openai/gpt-4-turbo-preview", - "display_name": "openai/gpt-4-turbo-preview", + "id": "qwen/qwen3-vl-235b-a22b-instruct", + "name": "Qwen3 VL 235B A22B Instruct", + "display_name": "Qwen3 VL 235B A22B Instruct", "limit": { - "context": 4096, - "output": 4096 + "context": 131072, + "output": 32768 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "type": "chat" }, { - "id": "openai/gpt-4.1", - "name": "openai/gpt-4.1", - "display_name": "openai/gpt-4.1", + "id": "qwen/qwen3-vl-235b-a22b-thinking", + "name": "Qwen3 VL 235B A22B Thinking", + "display_name": "Qwen3 VL 235B A22B Thinking", "limit": { - "context": 4096, - "output": 4096 + "context": 131072, + "output": 32768 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "type": "chat" }, { - "id": "openai/gpt-4.1-mini", - "name": "openai/gpt-4.1-mini", - "display_name": "openai/gpt-4.1-mini", + "id": "qwen/qwen3-235b-a22b-fp8", + "name": "Qwen3-235B-A22B", + "display_name": "Qwen3-235B-A22B", "limit": { - "context": 4096, - "output": 4096 + "context": 40960, + "output": 20000 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "type": "chat" }, { - "id": "openai/gpt-4.1-nano", - "name": "openai/gpt-4.1-nano", - "display_name": "openai/gpt-4.1-nano", + "id": "qwen/qwen3-30b-a3b-fp8", + "name": "Qwen3-30B-A3B", + "display_name": "Qwen3-30B-A3B", "limit": { - "context": 4096, - "output": 4096 + "context": 128000, + "output": 20000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "type": "chat" }, { - "id": "openai/gpt-4o", - "name": "openai/gpt-4o", - "display_name": "openai/gpt-4o", + "id": "xiaomimimo/mimo-v2-flash", + "name": "XiaomiMiMo/MiMo-V2-Flash", + "display_name": "XiaomiMiMo/MiMo-V2-Flash", "limit": { - "context": 4096, - "output": 4096 + "context": 262144, + "output": 32000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "type": "chat" }, { - "id": "openai/gpt-4o-2024-05-13", - "name": "openai/gpt-4o-2024-05-13", - "display_name": "openai/gpt-4o-2024-05-13", + "id": "zai-org/glm-4.5-air", + "name": "zai-org/glm-4.5-air", + "display_name": "zai-org/glm-4.5-air", "limit": { - "context": 4096, - "output": 4096 + "context": 131072, + "output": 98304 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "type": "chat" - }, + } + ] + }, + "tokenflux": { + "id": "tokenflux", + "name": "Tokenflux", + "display_name": "Tokenflux", + "models": [ { - "id": "openai/gpt-4o-2024-08-06", - "name": "openai/gpt-4o-2024-08-06", - "display_name": "openai/gpt-4o-2024-08-06", + "id": "anthropic/claude-3-haiku", + "name": "anthropic/claude-3-haiku", + "display_name": "anthropic/claude-3-haiku", "limit": { "context": 4096, "output": 4096 @@ -70727,9 +82363,9 @@ "type": "chat" }, { - "id": "openai/gpt-4o-2024-11-20", - "name": "openai/gpt-4o-2024-11-20", - "display_name": "openai/gpt-4o-2024-11-20", + "id": "anthropic/claude-3.5-haiku", + "name": "anthropic/claude-3.5-haiku", + "display_name": "anthropic/claude-3.5-haiku", "limit": { "context": 4096, "output": 4096 @@ -70741,9 +82377,9 @@ "type": "chat" }, { - "id": "openai/gpt-4o-audio-preview", - "name": "openai/gpt-4o-audio-preview", - "display_name": "openai/gpt-4o-audio-preview", + "id": "anthropic/claude-3.5-sonnet", + "name": "anthropic/claude-3.5-sonnet", + "display_name": "anthropic/claude-3.5-sonnet", "limit": { "context": 4096, "output": 4096 @@ -70755,9 +82391,9 @@ "type": "chat" }, { - "id": "openai/gpt-4o-mini", - "name": "openai/gpt-4o-mini", - "display_name": "openai/gpt-4o-mini", + "id": "anthropic/claude-3.7-sonnet", + "name": "anthropic/claude-3.7-sonnet", + "display_name": "anthropic/claude-3.7-sonnet", "limit": { "context": 4096, "output": 4096 @@ -70769,9 +82405,9 @@ "type": "chat" }, { - "id": "openai/gpt-4o-mini-2024-07-18", - "name": "openai/gpt-4o-mini-2024-07-18", - "display_name": "openai/gpt-4o-mini-2024-07-18", + "id": "anthropic/claude-haiku-4.5", + "name": "anthropic/claude-haiku-4.5", + "display_name": "anthropic/claude-haiku-4.5", "limit": { "context": 4096, "output": 4096 @@ -70783,9 +82419,9 @@ "type": "chat" }, { - "id": "openai/gpt-4o-mini-search-preview", - "name": "openai/gpt-4o-mini-search-preview", - "display_name": "openai/gpt-4o-mini-search-preview", + "id": "anthropic/claude-opus-4", + "name": "anthropic/claude-opus-4", + "display_name": "anthropic/claude-opus-4", "limit": { "context": 4096, "output": 4096 @@ -70797,9 +82433,9 @@ "type": "chat" }, { - "id": "openai/gpt-4o-search-preview", - "name": "openai/gpt-4o-search-preview", - "display_name": "openai/gpt-4o-search-preview", + "id": "anthropic/claude-opus-4.1", + "name": "anthropic/claude-opus-4.1", + "display_name": "anthropic/claude-opus-4.1", "limit": { "context": 4096, "output": 4096 @@ -70811,9 +82447,9 @@ "type": "chat" }, { - "id": "openai/gpt-5", - "name": "openai/gpt-5", - "display_name": "openai/gpt-5", + "id": "anthropic/claude-opus-4.5", + "name": "anthropic/claude-opus-4.5", + "display_name": "anthropic/claude-opus-4.5", "limit": { "context": 4096, "output": 4096 @@ -70825,9 +82461,9 @@ "type": "chat" }, { - "id": "openai/gpt-5-chat", - "name": "openai/gpt-5-chat", - "display_name": "openai/gpt-5-chat", + "id": "anthropic/claude-sonnet-4", + "name": "anthropic/claude-sonnet-4", + "display_name": "anthropic/claude-sonnet-4", "limit": { "context": 4096, "output": 4096 @@ -70839,9 +82475,9 @@ "type": "chat" }, { - "id": "openai/gpt-5-codex", - "name": "openai/gpt-5-codex", - "display_name": "openai/gpt-5-codex", + "id": "anthropic/claude-sonnet-4.5", + "name": "anthropic/claude-sonnet-4.5", + "display_name": "anthropic/claude-sonnet-4.5", "limit": { "context": 4096, "output": 4096 @@ -70853,9 +82489,9 @@ "type": "chat" }, { - "id": "openai/gpt-5-image", - "name": "openai/gpt-5-image", - "display_name": "openai/gpt-5-image", + "id": "deepseek/deepseek-chat", + "name": "deepseek/deepseek-chat", + "display_name": "deepseek/deepseek-chat", "limit": { "context": 4096, "output": 4096 @@ -70867,9 +82503,9 @@ "type": "chat" }, { - "id": "openai/gpt-5-image-mini", - "name": "openai/gpt-5-image-mini", - "display_name": "openai/gpt-5-image-mini", + "id": "deepseek/deepseek-chat-v3-0324", + "name": "deepseek/deepseek-chat-v3-0324", + "display_name": "deepseek/deepseek-chat-v3-0324", "limit": { "context": 4096, "output": 4096 @@ -70881,9 +82517,9 @@ "type": "chat" }, { - "id": "openai/gpt-5-mini", - "name": "openai/gpt-5-mini", - "display_name": "openai/gpt-5-mini", + "id": "deepseek/deepseek-chat-v3.1", + "name": "deepseek/deepseek-chat-v3.1", + "display_name": "deepseek/deepseek-chat-v3.1", "limit": { "context": 4096, "output": 4096 @@ -70895,9 +82531,9 @@ "type": "chat" }, { - "id": "openai/gpt-5-nano", - "name": "openai/gpt-5-nano", - "display_name": "openai/gpt-5-nano", + "id": "deepseek/deepseek-r1", + "name": "deepseek/deepseek-r1", + "display_name": "deepseek/deepseek-r1", "limit": { "context": 4096, "output": 4096 @@ -70909,9 +82545,9 @@ "type": "chat" }, { - "id": "openai/gpt-5-pro", - "name": "openai/gpt-5-pro", - "display_name": "openai/gpt-5-pro", + "id": "deepseek/deepseek-r1-0528", + "name": "deepseek/deepseek-r1-0528", + "display_name": "deepseek/deepseek-r1-0528", "limit": { "context": 4096, "output": 4096 @@ -70923,9 +82559,9 @@ "type": "chat" }, { - "id": "openai/gpt-5.1", - "name": "openai/gpt-5.1", - "display_name": "openai/gpt-5.1", + "id": "deepseek/deepseek-v3.1-terminus", + "name": "deepseek/deepseek-v3.1-terminus", + "display_name": "deepseek/deepseek-v3.1-terminus", "limit": { "context": 4096, "output": 4096 @@ -70937,9 +82573,9 @@ "type": "chat" }, { - "id": "openai/gpt-5.1-chat", - "name": "openai/gpt-5.1-chat", - "display_name": "openai/gpt-5.1-chat", + "id": "deepseek/deepseek-v3.2", + "name": "deepseek/deepseek-v3.2", + "display_name": "deepseek/deepseek-v3.2", "limit": { "context": 4096, "output": 4096 @@ -70951,9 +82587,9 @@ "type": "chat" }, { - "id": "openai/gpt-5.1-codex", - "name": "openai/gpt-5.1-codex", - "display_name": "openai/gpt-5.1-codex", + "id": "deepseek/deepseek-v3.2-exp", + "name": "deepseek/deepseek-v3.2-exp", + "display_name": "deepseek/deepseek-v3.2-exp", "limit": { "context": 4096, "output": 4096 @@ -70965,9 +82601,9 @@ "type": "chat" }, { - "id": "openai/gpt-5.1-codex-max", - "name": "openai/gpt-5.1-codex-max", - "display_name": "openai/gpt-5.1-codex-max", + "id": "deepseek/deepseek-v3.2-speciale", + "name": "deepseek/deepseek-v3.2-speciale", + "display_name": "deepseek/deepseek-v3.2-speciale", "limit": { "context": 4096, "output": 4096 @@ -70979,9 +82615,9 @@ "type": "chat" }, { - "id": "openai/gpt-5.1-codex-mini", - "name": "openai/gpt-5.1-codex-mini", - "display_name": "openai/gpt-5.1-codex-mini", + "id": "google/gemini-2.0-flash-001", + "name": "google/gemini-2.0-flash-001", + "display_name": "google/gemini-2.0-flash-001", "limit": { "context": 4096, "output": 4096 @@ -70993,9 +82629,9 @@ "type": "chat" }, { - "id": "openai/gpt-5.2", - "name": "openai/gpt-5.2", - "display_name": "openai/gpt-5.2", + "id": "google/gemini-2.0-flash-lite-001", + "name": "google/gemini-2.0-flash-lite-001", + "display_name": "google/gemini-2.0-flash-lite-001", "limit": { "context": 4096, "output": 4096 @@ -71007,9 +82643,9 @@ "type": "chat" }, { - "id": "openai/gpt-5.2-chat", - "name": "openai/gpt-5.2-chat", - "display_name": "openai/gpt-5.2-chat", + "id": "google/gemini-2.5-flash", + "name": "google/gemini-2.5-flash", + "display_name": "google/gemini-2.5-flash", "limit": { "context": 4096, "output": 4096 @@ -71021,9 +82657,9 @@ "type": "chat" }, { - "id": "openai/gpt-5.2-pro", - "name": "openai/gpt-5.2-pro", - "display_name": "openai/gpt-5.2-pro", + "id": "google/gemini-2.5-flash-image", + "name": "google/gemini-2.5-flash-image", + "display_name": "google/gemini-2.5-flash-image", "limit": { "context": 4096, "output": 4096 @@ -71035,9 +82671,9 @@ "type": "chat" }, { - "id": "openai/gpt-oss-120b", - "name": "openai/gpt-oss-120b", - "display_name": "openai/gpt-oss-120b", + "id": "google/gemini-2.5-flash-lite", + "name": "google/gemini-2.5-flash-lite", + "display_name": "google/gemini-2.5-flash-lite", "limit": { "context": 4096, "output": 4096 @@ -71049,9 +82685,9 @@ "type": "chat" }, { - "id": "openai/gpt-oss-20b", - "name": "openai/gpt-oss-20b", - "display_name": "openai/gpt-oss-20b", + "id": "google/gemini-2.5-flash-lite-preview-09-2025", + "name": "google/gemini-2.5-flash-lite-preview-09-2025", + "display_name": "google/gemini-2.5-flash-lite-preview-09-2025", "limit": { "context": 4096, "output": 4096 @@ -71063,9 +82699,9 @@ "type": "chat" }, { - "id": "openai/gpt-oss-safeguard-20b", - "name": "openai/gpt-oss-safeguard-20b", - "display_name": "openai/gpt-oss-safeguard-20b", + "id": "google/gemini-2.5-flash-preview-09-2025", + "name": "google/gemini-2.5-flash-preview-09-2025", + "display_name": "google/gemini-2.5-flash-preview-09-2025", "limit": { "context": 4096, "output": 4096 @@ -71077,9 +82713,9 @@ "type": "chat" }, { - "id": "openai/o1", - "name": "openai/o1", - "display_name": "openai/o1", + "id": "google/gemini-2.5-pro", + "name": "google/gemini-2.5-pro", + "display_name": "google/gemini-2.5-pro", "limit": { "context": 4096, "output": 4096 @@ -71091,9 +82727,9 @@ "type": "chat" }, { - "id": "openai/o1-pro", - "name": "openai/o1-pro", - "display_name": "openai/o1-pro", + "id": "google/gemini-2.5-pro-preview", + "name": "google/gemini-2.5-pro-preview", + "display_name": "google/gemini-2.5-pro-preview", "limit": { "context": 4096, "output": 4096 @@ -71105,9 +82741,9 @@ "type": "chat" }, { - "id": "openai/o3", - "name": "openai/o3", - "display_name": "openai/o3", + "id": "google/gemini-2.5-pro-preview-05-06", + "name": "google/gemini-2.5-pro-preview-05-06", + "display_name": "google/gemini-2.5-pro-preview-05-06", "limit": { "context": 4096, "output": 4096 @@ -71119,9 +82755,9 @@ "type": "chat" }, { - "id": "openai/o3-deep-research", - "name": "openai/o3-deep-research", - "display_name": "openai/o3-deep-research", + "id": "google/gemini-3-flash-preview", + "name": "google/gemini-3-flash-preview", + "display_name": "google/gemini-3-flash-preview", "limit": { "context": 4096, "output": 4096 @@ -71133,9 +82769,9 @@ "type": "chat" }, { - "id": "openai/o3-mini", - "name": "openai/o3-mini", - "display_name": "openai/o3-mini", + "id": "google/gemini-3-pro-image-preview", + "name": "google/gemini-3-pro-image-preview", + "display_name": "google/gemini-3-pro-image-preview", "limit": { "context": 4096, "output": 4096 @@ -71147,9 +82783,9 @@ "type": "chat" }, { - "id": "openai/o3-mini-high", - "name": "openai/o3-mini-high", - "display_name": "openai/o3-mini-high", + "id": "google/gemini-3-pro-preview", + "name": "google/gemini-3-pro-preview", + "display_name": "google/gemini-3-pro-preview", "limit": { "context": 4096, "output": 4096 @@ -71161,9 +82797,9 @@ "type": "chat" }, { - "id": "openai/o3-pro", - "name": "openai/o3-pro", - "display_name": "openai/o3-pro", + "id": "google/gemma-2-27b-it", + "name": "google/gemma-2-27b-it", + "display_name": "google/gemma-2-27b-it", "limit": { "context": 4096, "output": 4096 @@ -71175,9 +82811,9 @@ "type": "chat" }, { - "id": "openai/o4-mini", - "name": "openai/o4-mini", - "display_name": "openai/o4-mini", + "id": "google/gemma-2-9b-it", + "name": "google/gemma-2-9b-it", + "display_name": "google/gemma-2-9b-it", "limit": { "context": 4096, "output": 4096 @@ -71189,9 +82825,9 @@ "type": "chat" }, { - "id": "openai/o4-mini-deep-research", - "name": "openai/o4-mini-deep-research", - "display_name": "openai/o4-mini-deep-research", + "id": "google/gemma-3-12b-it", + "name": "google/gemma-3-12b-it", + "display_name": "google/gemma-3-12b-it", "limit": { "context": 4096, "output": 4096 @@ -71203,9 +82839,9 @@ "type": "chat" }, { - "id": "openai/o4-mini-high", - "name": "openai/o4-mini-high", - "display_name": "openai/o4-mini-high", + "id": "google/gemma-3-27b-it", + "name": "google/gemma-3-27b-it", + "display_name": "google/gemma-3-27b-it", "limit": { "context": 4096, "output": 4096 @@ -71217,9 +82853,9 @@ "type": "chat" }, { - "id": "qwen/qwen-2.5-72b-instruct", - "name": "qwen/qwen-2.5-72b-instruct", - "display_name": "qwen/qwen-2.5-72b-instruct", + "id": "google/gemma-3-4b-it", + "name": "google/gemma-3-4b-it", + "display_name": "google/gemma-3-4b-it", "limit": { "context": 4096, "output": 4096 @@ -71231,9 +82867,9 @@ "type": "chat" }, { - "id": "qwen/qwen-2.5-7b-instruct", - "name": "qwen/qwen-2.5-7b-instruct", - "display_name": "qwen/qwen-2.5-7b-instruct", + "id": "google/gemma-3n-e4b-it", + "name": "google/gemma-3n-e4b-it", + "display_name": "google/gemma-3n-e4b-it", "limit": { "context": 4096, "output": 4096 @@ -71245,9 +82881,9 @@ "type": "chat" }, { - "id": "qwen/qwen-2.5-coder-32b-instruct", - "name": "qwen/qwen-2.5-coder-32b-instruct", - "display_name": "qwen/qwen-2.5-coder-32b-instruct", + "id": "minimax/minimax-01", + "name": "minimax/minimax-01", + "display_name": "minimax/minimax-01", "limit": { "context": 4096, "output": 4096 @@ -71259,9 +82895,9 @@ "type": "chat" }, { - "id": "qwen/qwen-2.5-vl-7b-instruct", - "name": "qwen/qwen-2.5-vl-7b-instruct", - "display_name": "qwen/qwen-2.5-vl-7b-instruct", + "id": "minimax/minimax-m1", + "name": "minimax/minimax-m1", + "display_name": "minimax/minimax-m1", "limit": { "context": 4096, "output": 4096 @@ -71273,9 +82909,9 @@ "type": "chat" }, { - "id": "qwen/qwen-max", - "name": "qwen/qwen-max", - "display_name": "qwen/qwen-max", + "id": "minimax/minimax-m2", + "name": "minimax/minimax-m2", + "display_name": "minimax/minimax-m2", "limit": { "context": 4096, "output": 4096 @@ -71287,9 +82923,9 @@ "type": "chat" }, { - "id": "qwen/qwen-plus", - "name": "qwen/qwen-plus", - "display_name": "qwen/qwen-plus", + "id": "minimax/minimax-m2-her", + "name": "minimax/minimax-m2-her", + "display_name": "minimax/minimax-m2-her", "limit": { "context": 4096, "output": 4096 @@ -71301,9 +82937,9 @@ "type": "chat" }, { - "id": "qwen/qwen-plus-2025-07-28", - "name": "qwen/qwen-plus-2025-07-28", - "display_name": "qwen/qwen-plus-2025-07-28", + "id": "minimax/minimax-m2.1", + "name": "minimax/minimax-m2.1", + "display_name": "minimax/minimax-m2.1", "limit": { "context": 4096, "output": 4096 @@ -71315,9 +82951,9 @@ "type": "chat" }, { - "id": "qwen/qwen-turbo", - "name": "qwen/qwen-turbo", - "display_name": "qwen/qwen-turbo", + "id": "moonshotai/kimi-dev-72b", + "name": "moonshotai/kimi-dev-72b", + "display_name": "moonshotai/kimi-dev-72b", "limit": { "context": 4096, "output": 4096 @@ -71329,9 +82965,9 @@ "type": "chat" }, { - "id": "qwen/qwen-vl-max", - "name": "qwen/qwen-vl-max", - "display_name": "qwen/qwen-vl-max", + "id": "moonshotai/kimi-k2", + "name": "moonshotai/kimi-k2", + "display_name": "moonshotai/kimi-k2", "limit": { "context": 4096, "output": 4096 @@ -71343,9 +82979,9 @@ "type": "chat" }, { - "id": "qwen/qwen-vl-plus", - "name": "qwen/qwen-vl-plus", - "display_name": "qwen/qwen-vl-plus", + "id": "moonshotai/kimi-k2-0905", + "name": "moonshotai/kimi-k2-0905", + "display_name": "moonshotai/kimi-k2-0905", "limit": { "context": 4096, "output": 4096 @@ -71357,9 +82993,9 @@ "type": "chat" }, { - "id": "qwen/qwen2.5-coder-7b-instruct", - "name": "qwen/qwen2.5-coder-7b-instruct", - "display_name": "qwen/qwen2.5-coder-7b-instruct", + "id": "moonshotai/kimi-k2-thinking", + "name": "moonshotai/kimi-k2-thinking", + "display_name": "moonshotai/kimi-k2-thinking", "limit": { "context": 4096, "output": 4096 @@ -71371,9 +83007,9 @@ "type": "chat" }, { - "id": "qwen/qwen2.5-vl-32b-instruct", - "name": "qwen/qwen2.5-vl-32b-instruct", - "display_name": "qwen/qwen2.5-vl-32b-instruct", + "id": "moonshotai/kimi-k2.5", + "name": "moonshotai/kimi-k2.5", + "display_name": "moonshotai/kimi-k2.5", "limit": { "context": 4096, "output": 4096 @@ -71385,9 +83021,9 @@ "type": "chat" }, { - "id": "qwen/qwen2.5-vl-72b-instruct", - "name": "qwen/qwen2.5-vl-72b-instruct", - "display_name": "qwen/qwen2.5-vl-72b-instruct", + "id": "morph/morph-v3-fast", + "name": "morph/morph-v3-fast", + "display_name": "morph/morph-v3-fast", "limit": { "context": 4096, "output": 4096 @@ -71399,9 +83035,9 @@ "type": "chat" }, { - "id": "qwen/qwen3-14b", - "name": "qwen/qwen3-14b", - "display_name": "qwen/qwen3-14b", + "id": "morph/morph-v3-large", + "name": "morph/morph-v3-large", + "display_name": "morph/morph-v3-large", "limit": { "context": 4096, "output": 4096 @@ -71413,9 +83049,9 @@ "type": "chat" }, { - "id": "qwen/qwen3-235b-a22b", - "name": "qwen/qwen3-235b-a22b", - "display_name": "qwen/qwen3-235b-a22b", + "id": "openai/chatgpt-4o-latest", + "name": "openai/chatgpt-4o-latest", + "display_name": "openai/chatgpt-4o-latest", "limit": { "context": 4096, "output": 4096 @@ -71427,9 +83063,9 @@ "type": "chat" }, { - "id": "qwen/qwen3-235b-a22b-2507", - "name": "qwen/qwen3-235b-a22b-2507", - "display_name": "qwen/qwen3-235b-a22b-2507", + "id": "openai/gpt-3.5-turbo", + "name": "openai/gpt-3.5-turbo", + "display_name": "openai/gpt-3.5-turbo", "limit": { "context": 4096, "output": 4096 @@ -71441,9 +83077,9 @@ "type": "chat" }, { - "id": "qwen/qwen3-235b-a22b-thinking-2507", - "name": "qwen/qwen3-235b-a22b-thinking-2507", - "display_name": "qwen/qwen3-235b-a22b-thinking-2507", + "id": "openai/gpt-3.5-turbo-0613", + "name": "openai/gpt-3.5-turbo-0613", + "display_name": "openai/gpt-3.5-turbo-0613", "limit": { "context": 4096, "output": 4096 @@ -71455,9 +83091,9 @@ "type": "chat" }, { - "id": "qwen/qwen3-30b-a3b", - "name": "qwen/qwen3-30b-a3b", - "display_name": "qwen/qwen3-30b-a3b", + "id": "openai/gpt-3.5-turbo-16k", + "name": "openai/gpt-3.5-turbo-16k", + "display_name": "openai/gpt-3.5-turbo-16k", "limit": { "context": 4096, "output": 4096 @@ -71469,9 +83105,9 @@ "type": "chat" }, { - "id": "qwen/qwen3-30b-a3b-instruct-2507", - "name": "qwen/qwen3-30b-a3b-instruct-2507", - "display_name": "qwen/qwen3-30b-a3b-instruct-2507", + "id": "openai/gpt-3.5-turbo-instruct", + "name": "openai/gpt-3.5-turbo-instruct", + "display_name": "openai/gpt-3.5-turbo-instruct", "limit": { "context": 4096, "output": 4096 @@ -71483,9 +83119,9 @@ "type": "chat" }, { - "id": "qwen/qwen3-30b-a3b-thinking-2507", - "name": "qwen/qwen3-30b-a3b-thinking-2507", - "display_name": "qwen/qwen3-30b-a3b-thinking-2507", + "id": "openai/gpt-4", + "name": "openai/gpt-4", + "display_name": "openai/gpt-4", "limit": { "context": 4096, "output": 4096 @@ -71497,9 +83133,9 @@ "type": "chat" }, { - "id": "qwen/qwen3-32b", - "name": "qwen/qwen3-32b", - "display_name": "qwen/qwen3-32b", + "id": "openai/gpt-4-0314", + "name": "openai/gpt-4-0314", + "display_name": "openai/gpt-4-0314", "limit": { "context": 4096, "output": 4096 @@ -71511,9 +83147,9 @@ "type": "chat" }, { - "id": "qwen/qwen3-8b", - "name": "qwen/qwen3-8b", - "display_name": "qwen/qwen3-8b", + "id": "openai/gpt-4-1106-preview", + "name": "openai/gpt-4-1106-preview", + "display_name": "openai/gpt-4-1106-preview", "limit": { "context": 4096, "output": 4096 @@ -71525,9 +83161,9 @@ "type": "chat" }, { - "id": "qwen/qwen3-coder", - "name": "qwen/qwen3-coder", - "display_name": "qwen/qwen3-coder", + "id": "openai/gpt-4-turbo", + "name": "openai/gpt-4-turbo", + "display_name": "openai/gpt-4-turbo", "limit": { "context": 4096, "output": 4096 @@ -71539,9 +83175,9 @@ "type": "chat" }, { - "id": "qwen/qwen3-coder-30b-a3b-instruct", - "name": "qwen/qwen3-coder-30b-a3b-instruct", - "display_name": "qwen/qwen3-coder-30b-a3b-instruct", + "id": "openai/gpt-4-turbo-preview", + "name": "openai/gpt-4-turbo-preview", + "display_name": "openai/gpt-4-turbo-preview", "limit": { "context": 4096, "output": 4096 @@ -71553,9 +83189,9 @@ "type": "chat" }, { - "id": "qwen/qwen3-coder-flash", - "name": "qwen/qwen3-coder-flash", - "display_name": "qwen/qwen3-coder-flash", + "id": "openai/gpt-4.1", + "name": "openai/gpt-4.1", + "display_name": "openai/gpt-4.1", "limit": { "context": 4096, "output": 4096 @@ -71567,9 +83203,9 @@ "type": "chat" }, { - "id": "qwen/qwen3-coder-plus", - "name": "qwen/qwen3-coder-plus", - "display_name": "qwen/qwen3-coder-plus", + "id": "openai/gpt-4.1-mini", + "name": "openai/gpt-4.1-mini", + "display_name": "openai/gpt-4.1-mini", "limit": { "context": 4096, "output": 4096 @@ -71581,9 +83217,9 @@ "type": "chat" }, { - "id": "qwen/qwen3-max", - "name": "qwen/qwen3-max", - "display_name": "qwen/qwen3-max", + "id": "openai/gpt-4.1-nano", + "name": "openai/gpt-4.1-nano", + "display_name": "openai/gpt-4.1-nano", "limit": { "context": 4096, "output": 4096 @@ -71595,9 +83231,9 @@ "type": "chat" }, { - "id": "qwen/qwen3-next-80b-a3b-instruct", - "name": "qwen/qwen3-next-80b-a3b-instruct", - "display_name": "qwen/qwen3-next-80b-a3b-instruct", + "id": "openai/gpt-4o", + "name": "openai/gpt-4o", + "display_name": "openai/gpt-4o", "limit": { "context": 4096, "output": 4096 @@ -71609,9 +83245,9 @@ "type": "chat" }, { - "id": "qwen/qwen3-next-80b-a3b-thinking", - "name": "qwen/qwen3-next-80b-a3b-thinking", - "display_name": "qwen/qwen3-next-80b-a3b-thinking", + "id": "openai/gpt-4o-2024-05-13", + "name": "openai/gpt-4o-2024-05-13", + "display_name": "openai/gpt-4o-2024-05-13", "limit": { "context": 4096, "output": 4096 @@ -71623,9 +83259,9 @@ "type": "chat" }, { - "id": "qwen/qwen3-vl-235b-a22b-instruct", - "name": "qwen/qwen3-vl-235b-a22b-instruct", - "display_name": "qwen/qwen3-vl-235b-a22b-instruct", + "id": "openai/gpt-4o-2024-08-06", + "name": "openai/gpt-4o-2024-08-06", + "display_name": "openai/gpt-4o-2024-08-06", "limit": { "context": 4096, "output": 4096 @@ -71637,9 +83273,9 @@ "type": "chat" }, { - "id": "qwen/qwen3-vl-235b-a22b-thinking", - "name": "qwen/qwen3-vl-235b-a22b-thinking", - "display_name": "qwen/qwen3-vl-235b-a22b-thinking", + "id": "openai/gpt-4o-2024-11-20", + "name": "openai/gpt-4o-2024-11-20", + "display_name": "openai/gpt-4o-2024-11-20", "limit": { "context": 4096, "output": 4096 @@ -71651,9 +83287,9 @@ "type": "chat" }, { - "id": "qwen/qwen3-vl-30b-a3b-instruct", - "name": "qwen/qwen3-vl-30b-a3b-instruct", - "display_name": "qwen/qwen3-vl-30b-a3b-instruct", + "id": "openai/gpt-4o-audio-preview", + "name": "openai/gpt-4o-audio-preview", + "display_name": "openai/gpt-4o-audio-preview", "limit": { "context": 4096, "output": 4096 @@ -71665,9 +83301,9 @@ "type": "chat" }, { - "id": "qwen/qwen3-vl-30b-a3b-thinking", - "name": "qwen/qwen3-vl-30b-a3b-thinking", - "display_name": "qwen/qwen3-vl-30b-a3b-thinking", + "id": "openai/gpt-4o-mini", + "name": "openai/gpt-4o-mini", + "display_name": "openai/gpt-4o-mini", "limit": { "context": 4096, "output": 4096 @@ -71679,9 +83315,9 @@ "type": "chat" }, { - "id": "qwen/qwen3-vl-32b-instruct", - "name": "qwen/qwen3-vl-32b-instruct", - "display_name": "qwen/qwen3-vl-32b-instruct", + "id": "openai/gpt-4o-mini-2024-07-18", + "name": "openai/gpt-4o-mini-2024-07-18", + "display_name": "openai/gpt-4o-mini-2024-07-18", "limit": { "context": 4096, "output": 4096 @@ -71693,9 +83329,9 @@ "type": "chat" }, { - "id": "qwen/qwen3-vl-8b-instruct", - "name": "qwen/qwen3-vl-8b-instruct", - "display_name": "qwen/qwen3-vl-8b-instruct", + "id": "openai/gpt-4o-mini-search-preview", + "name": "openai/gpt-4o-mini-search-preview", + "display_name": "openai/gpt-4o-mini-search-preview", "limit": { "context": 4096, "output": 4096 @@ -71707,9 +83343,9 @@ "type": "chat" }, { - "id": "qwen/qwen3-vl-8b-thinking", - "name": "qwen/qwen3-vl-8b-thinking", - "display_name": "qwen/qwen3-vl-8b-thinking", + "id": "openai/gpt-4o-search-preview", + "name": "openai/gpt-4o-search-preview", + "display_name": "openai/gpt-4o-search-preview", "limit": { "context": 4096, "output": 4096 @@ -71721,9 +83357,9 @@ "type": "chat" }, { - "id": "qwen/qwq-32b", - "name": "qwen/qwq-32b", - "display_name": "qwen/qwq-32b", + "id": "openai/gpt-5", + "name": "openai/gpt-5", + "display_name": "openai/gpt-5", "limit": { "context": 4096, "output": 4096 @@ -71735,9 +83371,9 @@ "type": "chat" }, { - "id": "x-ai/grok-3", - "name": "x-ai/grok-3", - "display_name": "x-ai/grok-3", + "id": "openai/gpt-5-chat", + "name": "openai/gpt-5-chat", + "display_name": "openai/gpt-5-chat", "limit": { "context": 4096, "output": 4096 @@ -71749,9 +83385,9 @@ "type": "chat" }, { - "id": "x-ai/grok-3-beta", - "name": "x-ai/grok-3-beta", - "display_name": "x-ai/grok-3-beta", + "id": "openai/gpt-5-codex", + "name": "openai/gpt-5-codex", + "display_name": "openai/gpt-5-codex", "limit": { "context": 4096, "output": 4096 @@ -71763,9 +83399,9 @@ "type": "chat" }, { - "id": "x-ai/grok-3-mini", - "name": "x-ai/grok-3-mini", - "display_name": "x-ai/grok-3-mini", + "id": "openai/gpt-5-image", + "name": "openai/gpt-5-image", + "display_name": "openai/gpt-5-image", "limit": { "context": 4096, "output": 4096 @@ -71777,9 +83413,9 @@ "type": "chat" }, { - "id": "x-ai/grok-3-mini-beta", - "name": "x-ai/grok-3-mini-beta", - "display_name": "x-ai/grok-3-mini-beta", + "id": "openai/gpt-5-image-mini", + "name": "openai/gpt-5-image-mini", + "display_name": "openai/gpt-5-image-mini", "limit": { "context": 4096, "output": 4096 @@ -71791,9 +83427,9 @@ "type": "chat" }, { - "id": "x-ai/grok-4", - "name": "x-ai/grok-4", - "display_name": "x-ai/grok-4", + "id": "openai/gpt-5-mini", + "name": "openai/gpt-5-mini", + "display_name": "openai/gpt-5-mini", "limit": { "context": 4096, "output": 4096 @@ -71805,9 +83441,9 @@ "type": "chat" }, { - "id": "x-ai/grok-4-fast", - "name": "x-ai/grok-4-fast", - "display_name": "x-ai/grok-4-fast", + "id": "openai/gpt-5-nano", + "name": "openai/gpt-5-nano", + "display_name": "openai/gpt-5-nano", "limit": { "context": 4096, "output": 4096 @@ -71819,9 +83455,9 @@ "type": "chat" }, { - "id": "x-ai/grok-4.1-fast", - "name": "x-ai/grok-4.1-fast", - "display_name": "x-ai/grok-4.1-fast", + "id": "openai/gpt-5-pro", + "name": "openai/gpt-5-pro", + "display_name": "openai/gpt-5-pro", "limit": { "context": 4096, "output": 4096 @@ -71833,9 +83469,9 @@ "type": "chat" }, { - "id": "x-ai/grok-code-fast-1", - "name": "x-ai/grok-code-fast-1", - "display_name": "x-ai/grok-code-fast-1", + "id": "openai/gpt-5.1", + "name": "openai/gpt-5.1", + "display_name": "openai/gpt-5.1", "limit": { "context": 4096, "output": 4096 @@ -71847,9 +83483,9 @@ "type": "chat" }, { - "id": "z-ai/glm-4-32b", - "name": "z-ai/glm-4-32b", - "display_name": "z-ai/glm-4-32b", + "id": "openai/gpt-5.1-chat", + "name": "openai/gpt-5.1-chat", + "display_name": "openai/gpt-5.1-chat", "limit": { "context": 4096, "output": 4096 @@ -71861,9 +83497,9 @@ "type": "chat" }, { - "id": "z-ai/glm-4.5", - "name": "z-ai/glm-4.5", - "display_name": "z-ai/glm-4.5", + "id": "openai/gpt-5.1-codex", + "name": "openai/gpt-5.1-codex", + "display_name": "openai/gpt-5.1-codex", "limit": { "context": 4096, "output": 4096 @@ -71875,9 +83511,9 @@ "type": "chat" }, { - "id": "z-ai/glm-4.5-air", - "name": "z-ai/glm-4.5-air", - "display_name": "z-ai/glm-4.5-air", + "id": "openai/gpt-5.1-codex-max", + "name": "openai/gpt-5.1-codex-max", + "display_name": "openai/gpt-5.1-codex-max", "limit": { "context": 4096, "output": 4096 @@ -71889,9 +83525,9 @@ "type": "chat" }, { - "id": "z-ai/glm-4.5v", - "name": "z-ai/glm-4.5v", - "display_name": "z-ai/glm-4.5v", + "id": "openai/gpt-5.1-codex-mini", + "name": "openai/gpt-5.1-codex-mini", + "display_name": "openai/gpt-5.1-codex-mini", "limit": { "context": 4096, "output": 4096 @@ -71903,9 +83539,9 @@ "type": "chat" }, { - "id": "z-ai/glm-4.6", - "name": "z-ai/glm-4.6", - "display_name": "z-ai/glm-4.6", + "id": "openai/gpt-5.2", + "name": "openai/gpt-5.2", + "display_name": "openai/gpt-5.2", "limit": { "context": 4096, "output": 4096 @@ -71917,9 +83553,9 @@ "type": "chat" }, { - "id": "z-ai/glm-4.6v", - "name": "z-ai/glm-4.6v", - "display_name": "z-ai/glm-4.6v", + "id": "openai/gpt-5.2-chat", + "name": "openai/gpt-5.2-chat", + "display_name": "openai/gpt-5.2-chat", "limit": { "context": 4096, "output": 4096 @@ -71931,9 +83567,9 @@ "type": "chat" }, { - "id": "z-ai/glm-4.7", - "name": "z-ai/glm-4.7", - "display_name": "z-ai/glm-4.7", + "id": "openai/gpt-5.2-codex", + "name": "openai/gpt-5.2-codex", + "display_name": "openai/gpt-5.2-codex", "limit": { "context": 4096, "output": 4096 @@ -71943,1722 +83579,984 @@ "supported": false }, "type": "chat" - } - ] - }, - "aihubmix": { - "id": "aihubmix", - "name": "AIHubMix", - "display_name": "AIHubMix", - "models": [ - { - "id": "gemini-3-flash-preview", - "name": "gemini-3-flash-preview", - "display_name": "gemini-3-flash-preview", - "modalities": { - "input": [ - "text", - "image", - "audio", - "video" - ] - }, - "limit": { - "context": 1048576, - "output": 1048576 - }, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "cost": { - "input": 0.5, - "output": 3, - "cache_read": 0.05 - }, - "type": "chat" }, { - "id": "gemini-3-flash-preview-search", - "name": "gemini-3-flash-preview-search", - "display_name": "gemini-3-flash-preview-search", - "modalities": { - "input": [ - "text", - "image", - "audio" - ] - }, + "id": "openai/gpt-5.2-pro", + "name": "openai/gpt-5.2-pro", + "display_name": "openai/gpt-5.2-pro", "limit": { - "context": 8192, - "output": 8192 + "context": 4096, + "output": 4096 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "cost": { - "input": 0.5, - "output": 3, - "cache_read": 0.05 + "supported": false }, "type": "chat" }, { - "id": "claude-opus-4-5", - "name": "claude-opus-4-5", - "display_name": "claude-opus-4-5", - "modalities": { - "input": [ - "text", - "image" - ] - }, + "id": "openai/gpt-audio", + "name": "openai/gpt-audio", + "display_name": "openai/gpt-audio", "limit": { - "context": 200000, - "output": 200000 + "context": 4096, + "output": 4096 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5 + "supported": false }, "type": "chat" }, { - "id": "gemini-3-flash-preview-free", - "name": "gemini-3-flash-preview-free", - "display_name": "gemini-3-flash-preview-free", - "modalities": { - "input": [ - "text", - "image", - "audio", - "video" - ] - }, + "id": "openai/gpt-audio-mini", + "name": "openai/gpt-audio-mini", + "display_name": "openai/gpt-audio-mini", "limit": { - "context": 1048576, - "output": 1048576 + "context": 4096, + "output": 4096 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "cost": { - "input": 0, - "output": 0, - "cache_read": 0 + "supported": false }, "type": "chat" }, { - "id": "glm-4.7", - "name": "glm-4.7", - "display_name": "glm-4.7", - "modalities": { - "input": [ - "text" - ] - }, + "id": "openai/gpt-oss-120b", + "name": "openai/gpt-oss-120b", + "display_name": "openai/gpt-oss-120b", "limit": { - "context": 200000, - "output": 200000 + "context": 4096, + "output": 4096 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "cost": { - "input": 0.273974, - "output": 1.095896, - "cache_read": 0.054795 + "supported": false }, "type": "chat" }, { - "id": "gemini-2.0-flash-free", - "name": "gemini-2.0-flash-free", - "display_name": "gemini-2.0-flash-free", - "modalities": { - "input": [ - "text", - "image", - "audio", - "video" - ] - }, + "id": "openai/gpt-oss-20b", + "name": "openai/gpt-oss-20b", + "display_name": "openai/gpt-oss-20b", "limit": { - "context": 1048576, - "output": 1048576 + "context": 4096, + "output": 4096 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "cost": { - "input": 0, - "output": 0, - "cache_read": 0 - }, "type": "chat" }, { - "id": "coding-glm-4.7-free", - "name": "coding-glm-4.7-free", - "display_name": "coding-glm-4.7-free", - "modalities": { - "input": [ - "text" - ] - }, + "id": "openai/gpt-oss-safeguard-20b", + "name": "openai/gpt-oss-safeguard-20b", + "display_name": "openai/gpt-oss-safeguard-20b", "limit": { - "context": 8192, - "output": 8192 + "context": 4096, + "output": 4096 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "cost": { - "input": 0, - "output": 0, - "cache_read": 0 + "supported": false }, "type": "chat" }, { - "id": "gemini-3-pro-image-preview", - "name": "gemini-3-pro-image-preview", - "display_name": "gemini-3-pro-image-preview", - "modalities": { - "input": [ - "text", - "image" - ] - }, + "id": "openai/o1", + "name": "openai/o1", + "display_name": "openai/o1", "limit": { - "context": 8192, - "output": 8192 + "context": 4096, + "output": 4096 }, "tool_call": false, "reasoning": { "supported": false }, - "cost": { - "input": 2, - "output": 12, - "cache_read": 2 - }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "gpt-image-1.5", - "name": "gpt-image-1.5", - "display_name": "gpt-image-1.5", - "modalities": { - "input": [ - "text", - "image" - ] - }, + "id": "openai/o1-pro", + "name": "openai/o1-pro", + "display_name": "openai/o1-pro", "limit": { - "context": 8192, - "output": 8192 + "context": 4096, + "output": 4096 }, "tool_call": false, "reasoning": { "supported": false }, - "cost": { - "input": 5, - "output": 10, - "cache_read": 5 - }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "gpt-5.2", - "name": "gpt-5.2", - "display_name": "gpt-5.2", - "modalities": { - "input": [ - "text", - "image" - ] - }, + "id": "openai/o3", + "name": "openai/o3", + "display_name": "openai/o3", "limit": { - "context": 400000, - "output": 400000 + "context": 4096, + "output": 4096 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "supported": false }, "type": "chat" }, { - "id": "gpt-5.2-chat-latest", - "name": "gpt-5.2-chat-latest", - "display_name": "gpt-5.2-chat-latest", - "modalities": { - "input": [ - "text", - "image" - ] - }, + "id": "openai/o3-deep-research", + "name": "openai/o3-deep-research", + "display_name": "openai/o3-deep-research", "limit": { - "context": 128000, - "output": 128000 + "context": 4096, + "output": 4096 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 - }, "type": "chat" }, { - "id": "gemini-3-pro-preview", - "name": "gemini-3-pro-preview", - "display_name": "gemini-3-pro-preview", - "modalities": { - "input": [ - "text", - "image", - "audio", - "video" - ] - }, + "id": "openai/o3-mini", + "name": "openai/o3-mini", + "display_name": "openai/o3-mini", "limit": { - "context": 8192, - "output": 8192 + "context": 4096, + "output": 4096 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "cost": { - "input": 2, - "output": 12, - "cache_read": 0.2 + "supported": false }, "type": "chat" }, { - "id": "gpt-5.2-pro", - "name": "gpt-5.2-pro", - "display_name": "gpt-5.2-pro", - "modalities": { - "input": [ - "text", - "image" - ] - }, + "id": "openai/o3-mini-high", + "name": "openai/o3-mini-high", + "display_name": "openai/o3-mini-high", "limit": { - "context": 400000, - "output": 400000 + "context": 4096, + "output": 4096 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "cost": { - "input": 21, - "output": 168, - "cache_read": 2.1 + "supported": false }, "type": "chat" }, { - "id": "gpt-5.1", - "name": "gpt-5.1", - "display_name": "gpt-5.1", - "modalities": { - "input": [ - "text", - "image" - ] - }, + "id": "openai/o3-pro", + "name": "openai/o3-pro", + "display_name": "openai/o3-pro", "limit": { - "context": 400000, - "output": 400000 + "context": 4096, + "output": 4096 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "supported": false }, "type": "chat" }, { - "id": "gpt-5.1-codex-max", - "name": "gpt-5.1-codex-max", - "display_name": "gpt-5.1-codex-max", - "modalities": { - "input": [ - "text", - "image" - ] - }, + "id": "openai/o4-mini", + "name": "openai/o4-mini", + "display_name": "openai/o4-mini", "limit": { - "context": 400000, - "output": 400000 + "context": 4096, + "output": 4096 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "supported": false }, "type": "chat" }, { - "id": "gemini-3-pro-preview-search", - "name": "gemini-3-pro-preview-search", - "display_name": "gemini-3-pro-preview-search", - "modalities": { - "input": [ - "text", - "image", - "audio", - "video" - ] - }, + "id": "openai/o4-mini-deep-research", + "name": "openai/o4-mini-deep-research", + "display_name": "openai/o4-mini-deep-research", "limit": { - "context": 8192, - "output": 8192 + "context": 4096, + "output": 4096 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "cost": { - "input": 2, - "output": 12, - "cache_read": 0.2 + "supported": false }, "type": "chat" }, { - "id": "gpt-5.1-chat-latest", - "name": "gpt-5.1-chat-latest", - "display_name": "gpt-5.1-chat-latest", - "modalities": { - "input": [ - "text", - "image" - ] - }, + "id": "openai/o4-mini-high", + "name": "openai/o4-mini-high", + "display_name": "openai/o4-mini-high", "limit": { - "context": 128000, - "output": 128000 + "context": 4096, + "output": 4096 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 - }, "type": "chat" }, { - "id": "gpt-5.1-codex", - "name": "gpt-5.1-codex", - "display_name": "gpt-5.1-codex", - "modalities": { - "input": [ - "text", - "image" - ] - }, + "id": "qwen/qwen-2.5-72b-instruct", + "name": "qwen/qwen-2.5-72b-instruct", + "display_name": "qwen/qwen-2.5-72b-instruct", "limit": { - "context": 400000, - "output": 400000 + "context": 4096, + "output": 4096 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "supported": false }, "type": "chat" }, { - "id": "gpt-5.1-codex-mini", - "name": "gpt-5.1-codex-mini", - "display_name": "gpt-5.1-codex-mini", - "modalities": { - "input": [ - "text", - "image" - ] - }, + "id": "qwen/qwen-2.5-7b-instruct", + "name": "qwen/qwen-2.5-7b-instruct", + "display_name": "qwen/qwen-2.5-7b-instruct", "limit": { - "context": 400000, - "output": 400000 + "context": 4096, + "output": 4096 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.025 + "supported": false }, "type": "chat" }, { - "id": "doubao-seed-1-8", - "name": "doubao-seed-1-8", - "display_name": "doubao-seed-1-8", - "modalities": { - "input": [ - "text", - "image", - "video" - ] - }, + "id": "qwen/qwen-2.5-coder-32b-instruct", + "name": "qwen/qwen-2.5-coder-32b-instruct", + "display_name": "qwen/qwen-2.5-coder-32b-instruct", "limit": { - "context": 256000, - "output": 256000 + "context": 4096, + "output": 4096 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "cost": { - "input": 0.10959, - "output": 0.273975, - "cache_read": 0.021918 + "supported": false }, "type": "chat" }, { - "id": "claude-haiku-4-5", - "name": "claude-haiku-4-5", - "display_name": "claude-haiku-4-5", - "modalities": { - "input": [ - "text", - "image" - ] - }, + "id": "qwen/qwen-2.5-vl-7b-instruct", + "name": "qwen/qwen-2.5-vl-7b-instruct", + "display_name": "qwen/qwen-2.5-vl-7b-instruct", "limit": { - "context": 204800, - "output": 204800 + "context": 4096, + "output": 4096 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "cost": { - "input": 1.1, - "output": 5.5, - "cache_read": 0.11 + "supported": false }, "type": "chat" }, { - "id": "claude-sonnet-4-5", - "name": "claude-sonnet-4-5", - "display_name": "claude-sonnet-4-5", - "modalities": { - "input": [ - "text", - "image" - ] - }, + "id": "qwen/qwen-max", + "name": "qwen/qwen-max", + "display_name": "qwen/qwen-max", "limit": { - "context": 1000000, - "output": 1000000 + "context": 4096, + "output": 4096 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "cost": { - "input": 3.3, - "output": 16.5, - "cache_read": 0.33 + "supported": false }, "type": "chat" }, { - "id": "mistral-large-3", - "name": "mistral-large-3", - "display_name": "mistral-large-3", - "modalities": { - "input": [ - "text", - "image" - ] - }, + "id": "qwen/qwen-plus", + "name": "qwen/qwen-plus", + "display_name": "qwen/qwen-plus", "limit": { - "context": 256000, - "output": 256000 + "context": 4096, + "output": 4096 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "cost": { - "input": 0.5, - "output": 1.5 - }, "type": "chat" }, { - "id": "gemini-2.5-flash-image", - "name": "gemini-2.5-flash-image", - "display_name": "gemini-2.5-flash-image", - "modalities": { - "input": [ - "image", - "text" - ] - }, + "id": "qwen/qwen-plus-2025-07-28", + "name": "qwen/qwen-plus-2025-07-28", + "display_name": "qwen/qwen-plus-2025-07-28", "limit": { - "context": 32800, - "output": 32800 + "context": 4096, + "output": 4096 }, "tool_call": false, "reasoning": { "supported": false }, - "cost": { - "input": 0.3, - "output": 2.499, - "cache_read": 0.3 - }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "grok-4-1-fast-non-reasoning", - "name": "grok-4-1-fast-non-reasoning", - "display_name": "grok-4-1-fast-non-reasoning", - "modalities": { - "input": [ - "text", - "image" - ] - }, + "id": "qwen/qwen-turbo", + "name": "qwen/qwen-turbo", + "display_name": "qwen/qwen-turbo", "limit": { - "context": 2000000, - "output": 2000000 + "context": 4096, + "output": 4096 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 + "supported": false }, "type": "chat" }, { - "id": "grok-4-1-fast-reasoning", - "name": "grok-4-1-fast-reasoning", - "display_name": "grok-4-1-fast-reasoning", - "modalities": { - "input": [ - "text", - "image" - ] - }, + "id": "qwen/qwen-vl-max", + "name": "qwen/qwen-vl-max", + "display_name": "qwen/qwen-vl-max", "limit": { - "context": 2000000, - "output": 2000000 + "context": 4096, + "output": 4096 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 + "supported": false }, "type": "chat" }, { - "id": "mimo-v2-flash", - "name": "mimo-v2-flash", - "display_name": "mimo-v2-flash", - "modalities": { - "input": [ - "text" - ] - }, + "id": "qwen/qwen-vl-plus", + "name": "qwen/qwen-vl-plus", + "display_name": "qwen/qwen-vl-plus", "limit": { - "context": 8192, - "output": 8192 + "context": 4096, + "output": 4096 }, "tool_call": false, "reasoning": { "supported": false }, - "cost": { - "input": 0.1918, - "output": 0.5754, - "cache_read": 0.03836 - }, "type": "chat" }, { - "id": "web-gpt-image-1.5", - "name": "web-gpt-image-1.5", - "display_name": "web-gpt-image-1.5", - "modalities": { - "input": [ - "text", - "image" - ] - }, + "id": "qwen/qwen2.5-coder-7b-instruct", + "name": "qwen/qwen2.5-coder-7b-instruct", + "display_name": "qwen/qwen2.5-coder-7b-instruct", "limit": { - "context": 8192, - "output": 8192 + "context": 4096, + "output": 4096 }, "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 3, - "output": 3, - "cache_read": 0 + "reasoning": { + "supported": false }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "gpt-5", - "name": "gpt-5", - "display_name": "gpt-5", - "modalities": { - "input": [ - "text", - "image" - ] - }, + "id": "qwen/qwen2.5-vl-32b-instruct", + "name": "qwen/qwen2.5-vl-32b-instruct", + "display_name": "qwen/qwen2.5-vl-32b-instruct", "limit": { - "context": 400000, - "output": 400000 + "context": 4096, + "output": 4096 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "supported": false }, "type": "chat" }, { - "id": "deepseek-v3.2-fast", - "name": "deepseek-v3.2-fast", - "display_name": "deepseek-v3.2-fast", - "modalities": { - "input": [ - "text" - ] - }, + "id": "qwen/qwen2.5-vl-72b-instruct", + "name": "qwen/qwen2.5-vl-72b-instruct", + "display_name": "qwen/qwen2.5-vl-72b-instruct", "limit": { - "context": 128000, - "output": 128000 + "context": 4096, + "output": 4096 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "cost": { - "input": 1.096, - "output": 3.288, - "cache_read": 1.096 - }, "type": "chat" }, { - "id": "deepseek-v3.2", - "name": "deepseek-v3.2", - "display_name": "deepseek-v3.2", - "modalities": { - "input": [ - "text" - ] - }, + "id": "qwen/qwen3-14b", + "name": "qwen/qwen3-14b", + "display_name": "qwen/qwen3-14b", "limit": { - "context": 128000, - "output": 128000 + "context": 4096, + "output": 4096 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "cost": { - "input": 0.302, - "output": 0.453, - "cache_read": 0.0302 - }, "type": "chat" }, { - "id": "deepseek-v3.2-speciale", - "name": "deepseek-v3.2-speciale", - "display_name": "deepseek-v3.2-speciale", - "modalities": { - "input": [ - "text" - ] - }, + "id": "qwen/qwen3-235b-a22b", + "name": "qwen/qwen3-235b-a22b", + "display_name": "qwen/qwen3-235b-a22b", "limit": { - "context": 128000, - "output": 128000 + "context": 4096, + "output": 4096 }, "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "cost": { - "input": 0.58, - "output": 1.680028 + "supported": false }, "type": "chat" }, { - "id": "deepseek-v3.2-think", - "name": "deepseek-v3.2-think", - "display_name": "deepseek-v3.2-think", - "modalities": { - "input": [ - "text" - ] - }, + "id": "qwen/qwen3-235b-a22b-2507", + "name": "qwen/qwen3-235b-a22b-2507", + "display_name": "qwen/qwen3-235b-a22b-2507", "limit": { - "context": 128000, - "output": 128000 + "context": 4096, + "output": 4096 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "cost": { - "input": 0.302, - "output": 0.453, - "cache_read": 0.0302 - }, "type": "chat" }, { - "id": "deepseek-math-v2", - "name": "deepseek-math-v2", - "display_name": "deepseek-math-v2", - "modalities": { - "input": [ - "text" - ] - }, + "id": "qwen/qwen3-235b-a22b-thinking-2507", + "name": "qwen/qwen3-235b-a22b-thinking-2507", + "display_name": "qwen/qwen3-235b-a22b-thinking-2507", "limit": { - "context": 163000, - "output": 163000 + "context": 4096, + "output": 4096 }, "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "cost": { - "input": 0.492, - "output": 1.968, - "cache_read": 0.0984 + "supported": false }, "type": "chat" }, { - "id": "DeepSeek-V3.2-Exp", - "name": "DeepSeek-V3.2-Exp", - "display_name": "DeepSeek-V3.2-Exp", - "modalities": { - "input": [ - "text" - ] - }, + "id": "qwen/qwen3-30b-a3b", + "name": "qwen/qwen3-30b-a3b", + "display_name": "qwen/qwen3-30b-a3b", "limit": { - "context": 163000, - "output": 163000 + "context": 4096, + "output": 4096 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "cost": { - "input": 0.274, - "output": 0.411, - "cache_read": 0.0274 - }, "type": "chat" }, { - "id": "DeepSeek-V3.2-Exp-Think", - "name": "DeepSeek-V3.2-Exp-Think", - "display_name": "DeepSeek-V3.2-Exp-Think", - "modalities": { - "input": [ - "text" - ] - }, + "id": "qwen/qwen3-30b-a3b-instruct-2507", + "name": "qwen/qwen3-30b-a3b-instruct-2507", + "display_name": "qwen/qwen3-30b-a3b-instruct-2507", "limit": { - "context": 131000, - "output": 131000 + "context": 4096, + "output": 4096 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "cost": { - "input": 0.274, - "output": 0.411, - "cache_read": 0.0274 + "supported": false }, "type": "chat" }, { - "id": "gpt-5-codex", - "name": "gpt-5-codex", - "display_name": "gpt-5-codex", - "modalities": { - "input": [ - "text", - "image" - ] - }, + "id": "qwen/qwen3-30b-a3b-thinking-2507", + "name": "qwen/qwen3-30b-a3b-thinking-2507", + "display_name": "qwen/qwen3-30b-a3b-thinking-2507", "limit": { - "context": 400000, - "output": 400000 + "context": 4096, + "output": 4096 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "supported": false }, "type": "chat" }, { - "id": "DeepSeek-V3.1-Terminus", - "name": "DeepSeek-V3.1-Terminus", - "display_name": "DeepSeek-V3.1-Terminus", - "modalities": { - "input": [ - "text" - ] - }, + "id": "qwen/qwen3-32b", + "name": "qwen/qwen3-32b", + "display_name": "qwen/qwen3-32b", "limit": { - "context": 160000, - "output": 160000 + "context": 4096, + "output": 4096 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "cost": { - "input": 0.56, - "output": 1.68 - }, "type": "chat" }, { - "id": "DeepSeek-V3.1-Think", - "name": "DeepSeek-V3.1-Think", - "display_name": "DeepSeek-V3.1-Think", - "modalities": { - "input": [ - "text" - ] - }, + "id": "qwen/qwen3-8b", + "name": "qwen/qwen3-8b", + "display_name": "qwen/qwen3-8b", "limit": { - "context": 128000, - "output": 128000 + "context": 4096, + "output": 4096 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "cost": { - "input": 0.56, - "output": 1.68 + "supported": false }, "type": "chat" }, { - "id": "gpt-5-pro", - "name": "gpt-5-pro", - "display_name": "gpt-5-pro", - "modalities": { - "input": [ - "text", - "image" - ] - }, + "id": "qwen/qwen3-coder", + "name": "qwen/qwen3-coder", + "display_name": "qwen/qwen3-coder", "limit": { - "context": 400000, - "output": 400000 + "context": 4096, + "output": 4096 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "cost": { - "input": 15, - "output": 120 + "supported": false }, "type": "chat" }, { - "id": "gpt-5-mini", - "name": "gpt-5-mini", - "display_name": "gpt-5-mini", - "modalities": { - "input": [ - "text", - "image" - ] - }, + "id": "qwen/qwen3-coder-30b-a3b-instruct", + "name": "qwen/qwen3-coder-30b-a3b-instruct", + "display_name": "qwen/qwen3-coder-30b-a3b-instruct", "limit": { - "context": 400000, - "output": 400000 + "context": 4096, + "output": 4096 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.025 + "supported": false }, "type": "chat" }, { - "id": "gpt-5-nano", - "name": "gpt-5-nano", - "display_name": "gpt-5-nano", - "modalities": { - "input": [ - "text", - "image" - ] - }, + "id": "qwen/qwen3-coder-flash", + "name": "qwen/qwen3-coder-flash", + "display_name": "qwen/qwen3-coder-flash", "limit": { - "context": 400000, - "output": 400000 + "context": 4096, + "output": 4096 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "cost": { - "input": 0.05, - "output": 0.4, - "cache_read": 0.005 + "supported": false }, "type": "chat" }, { - "id": "gpt-5-chat-latest", - "name": "gpt-5-chat-latest", - "display_name": "gpt-5-chat-latest", - "modalities": { - "input": [ - "text", - "image" - ] - }, + "id": "qwen/qwen3-coder-plus", + "name": "qwen/qwen3-coder-plus", + "display_name": "qwen/qwen3-coder-plus", "limit": { - "context": 400000, - "output": 400000 + "context": 4096, + "output": 4096 }, "tool_call": false, "reasoning": { "supported": false }, - "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 - }, "type": "chat" }, { - "id": "claude-opus-4-1", - "name": "claude-opus-4-1", - "display_name": "claude-opus-4-1", - "modalities": { - "input": [ - "text", - "image" - ] - }, + "id": "qwen/qwen3-max", + "name": "qwen/qwen3-max", + "display_name": "qwen/qwen3-max", "limit": { - "context": 200000, - "output": 200000 + "context": 4096, + "output": 4096 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "cost": { - "input": 16.5, - "output": 82.5 + "supported": false }, "type": "chat" }, { - "id": "doubao-seedream-4-5", - "name": "doubao-seedream-4-5", - "display_name": "doubao-seedream-4-5", - "modalities": { - "input": [ - "text", - "image" - ] - }, + "id": "qwen/qwen3-next-80b-a3b-instruct", + "name": "qwen/qwen3-next-80b-a3b-instruct", + "display_name": "qwen/qwen3-next-80b-a3b-instruct", "limit": { - "context": 8192, - "output": 8192 + "context": 4096, + "output": 4096 }, "tool_call": false, "reasoning": { "supported": false }, - "cost": { - "input": 2, - "output": 0, - "cache_read": 0 - }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "sora-2", - "name": "sora-2", - "display_name": "sora-2", + "id": "qwen/qwen3-next-80b-a3b-thinking", + "name": "qwen/qwen3-next-80b-a3b-thinking", + "display_name": "qwen/qwen3-next-80b-a3b-thinking", "limit": { - "context": 8192, - "output": 8192 + "context": 4096, + "output": 4096 }, "tool_call": false, "reasoning": { "supported": false }, - "cost": { - "input": 2, - "output": 2 - }, "type": "chat" }, { - "id": "sora-2-pro", - "name": "sora-2-pro", - "display_name": "sora-2-pro", + "id": "qwen/qwen3-vl-235b-a22b-instruct", + "name": "qwen/qwen3-vl-235b-a22b-instruct", + "display_name": "qwen/qwen3-vl-235b-a22b-instruct", "limit": { - "context": 8192, - "output": 8192 + "context": 4096, + "output": 4096 }, "tool_call": false, "reasoning": { "supported": false }, - "cost": { - "input": 2, - "output": 2 - }, "type": "chat" }, { - "id": "o3", - "name": "o3", - "display_name": "o3", - "modalities": { - "input": [ - "text", - "image" - ] - }, + "id": "qwen/qwen3-vl-235b-a22b-thinking", + "name": "qwen/qwen3-vl-235b-a22b-thinking", + "display_name": "qwen/qwen3-vl-235b-a22b-thinking", "limit": { - "context": 200000, - "output": 200000 + "context": 4096, + "output": 4096 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "cost": { - "input": 2, - "output": 8, - "cache_read": 0.5 + "supported": false }, "type": "chat" }, { - "id": "wan2.6-i2v", - "name": "wan2.6-i2v", - "display_name": "wan2.6-i2v", - "modalities": { - "input": [ - "image", - "text" - ] - }, + "id": "qwen/qwen3-vl-30b-a3b-instruct", + "name": "qwen/qwen3-vl-30b-a3b-instruct", + "display_name": "qwen/qwen3-vl-30b-a3b-instruct", "limit": { - "context": 8192, - "output": 8192 + "context": 4096, + "output": 4096 }, "tool_call": false, "reasoning": { "supported": false }, - "cost": { - "input": 2, - "output": 0 - }, "type": "chat" }, { - "id": "wan2.6-t2v", - "name": "wan2.6-t2v", - "display_name": "wan2.6-t2v", - "modalities": { - "input": [ - "text" - ] - }, + "id": "qwen/qwen3-vl-30b-a3b-thinking", + "name": "qwen/qwen3-vl-30b-a3b-thinking", + "display_name": "qwen/qwen3-vl-30b-a3b-thinking", "limit": { - "context": 8192, - "output": 8192 + "context": 4096, + "output": 4096 }, "tool_call": false, "reasoning": { "supported": false }, - "cost": { - "input": 2, - "output": 0 - }, "type": "chat" }, { - "id": "gpt-4o-audio-preview", - "name": "gpt-4o-audio-preview", - "display_name": "gpt-4o-audio-preview", - "modalities": { - "input": [ - "text", - "audio" - ] - }, + "id": "qwen/qwen3-vl-32b-instruct", + "name": "qwen/qwen3-vl-32b-instruct", + "display_name": "qwen/qwen3-vl-32b-instruct", "limit": { - "context": 128000, - "output": 128000 + "context": 4096, + "output": 4096 }, "tool_call": false, "reasoning": { "supported": false }, - "cost": { - "input": 2.5, - "output": 10 - }, "type": "chat" }, { - "id": "gpt-4o-mini-audio-preview", - "name": "gpt-4o-mini-audio-preview", - "display_name": "gpt-4o-mini-audio-preview", - "modalities": { - "input": [ - "text", - "audio" - ] - }, + "id": "qwen/qwen3-vl-8b-instruct", + "name": "qwen/qwen3-vl-8b-instruct", + "display_name": "qwen/qwen3-vl-8b-instruct", "limit": { - "context": 8192, - "output": 8192 + "context": 4096, + "output": 4096 }, "tool_call": false, "reasoning": { "supported": false }, - "cost": { - "input": 0.15, - "output": 0.6 - }, "type": "chat" }, { - "id": "minimax-m2.1", - "name": "minimax-m2.1", - "display_name": "minimax-m2.1", + "id": "qwen/qwen3-vl-8b-thinking", + "name": "qwen/qwen3-vl-8b-thinking", + "display_name": "qwen/qwen3-vl-8b-thinking", "limit": { - "context": 204800, - "output": 204800 + "context": 4096, + "output": 4096 }, "tool_call": false, "reasoning": { "supported": false }, - "cost": { - "input": 0.288, - "output": 1.152 - }, "type": "chat" }, { - "id": "cc-glm-4.7", - "name": "cc-glm-4.7", - "display_name": "cc-glm-4.7", + "id": "qwen/qwq-32b", + "name": "qwen/qwq-32b", + "display_name": "qwen/qwq-32b", "limit": { - "context": 8192, - "output": 8192 + "context": 4096, + "output": 4096 }, "tool_call": false, "reasoning": { "supported": false }, - "cost": { - "input": 0.06, - "output": 0.22 - }, "type": "chat" }, { - "id": "cc-minimax-m2.1", - "name": "cc-minimax-m2.1", - "display_name": "cc-minimax-m2.1", - "modalities": { - "input": [ - "text" - ] - }, + "id": "x-ai/grok-3", + "name": "x-ai/grok-3", + "display_name": "x-ai/grok-3", "limit": { - "context": 8192, - "output": 8192 + "context": 4096, + "output": 4096 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "cost": { - "input": 0.1, - "output": 0.1 - }, "type": "chat" }, { - "id": "coding-glm-4.7", - "name": "coding-glm-4.7", - "display_name": "coding-glm-4.7", - "modalities": { - "input": [ - "text" - ] - }, + "id": "x-ai/grok-3-beta", + "name": "x-ai/grok-3-beta", + "display_name": "x-ai/grok-3-beta", "limit": { - "context": 8192, - "output": 8192 + "context": 4096, + "output": 4096 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "cost": { - "input": 0.06, - "output": 0.22, - "cache_read": 0.010998 + "supported": false }, "type": "chat" }, { - "id": "coding-minimax-m2.1", - "name": "coding-minimax-m2.1", - "display_name": "coding-minimax-m2.1", - "modalities": { - "input": [ - "text" - ] - }, + "id": "x-ai/grok-3-mini", + "name": "x-ai/grok-3-mini", + "display_name": "x-ai/grok-3-mini", "limit": { - "context": 204800, - "output": 204800 + "context": 4096, + "output": 4096 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "cost": { - "input": 0.2, - "output": 0.2 + "supported": false }, "type": "chat" }, { - "id": "coding-minimax-m2.1-free", - "name": "coding-minimax-m2.1-free", - "display_name": "coding-minimax-m2.1-free", + "id": "x-ai/grok-3-mini-beta", + "name": "x-ai/grok-3-mini-beta", + "display_name": "x-ai/grok-3-mini-beta", "limit": { - "context": 204800, - "output": 204800 + "context": 4096, + "output": 4096 }, "tool_call": false, "reasoning": { "supported": false }, - "cost": { - "input": 0, - "output": 0 - }, "type": "chat" }, { - "id": "cc-glm-4.6", - "name": "cc-glm-4.6", - "display_name": "cc-glm-4.6", + "id": "x-ai/grok-4", + "name": "x-ai/grok-4", + "display_name": "x-ai/grok-4", "limit": { - "context": 8192, - "output": 8192 + "context": 4096, + "output": 4096 }, "tool_call": false, "reasoning": { "supported": false }, - "cost": { - "input": 0.06, - "output": 0.22 - }, "type": "chat" }, { - "id": "coding-glm-4.6", - "name": "coding-glm-4.6", - "display_name": "coding-glm-4.6", - "modalities": { - "input": [ - "text" - ] - }, + "id": "x-ai/grok-4-fast", + "name": "x-ai/grok-4-fast", + "display_name": "x-ai/grok-4-fast", "limit": { - "context": 8192, - "output": 8192 + "context": 4096, + "output": 4096 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "cost": { - "input": 0.06, - "output": 0.22, - "cache_read": 0.010998 + "supported": false }, "type": "chat" }, { - "id": "coding-glm-4.6-free", - "name": "coding-glm-4.6-free", - "display_name": "coding-glm-4.6-free", - "modalities": { - "input": [ - "text" - ] - }, + "id": "x-ai/grok-4.1-fast", + "name": "x-ai/grok-4.1-fast", + "display_name": "x-ai/grok-4.1-fast", "limit": { - "context": 200000, - "output": 200000 + "context": 4096, + "output": 4096 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "cost": { - "input": 0, - "output": 0, - "cache_read": 0 + "supported": false }, "type": "chat" }, { - "id": "coding-minimax-m2", - "name": "coding-minimax-m2", - "display_name": "coding-minimax-m2", - "modalities": { - "input": [ - "text" - ] - }, + "id": "x-ai/grok-code-fast-1", + "name": "x-ai/grok-code-fast-1", + "display_name": "x-ai/grok-code-fast-1", "limit": { - "context": 204800, - "output": 204800 + "context": 4096, + "output": 4096 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "cost": { - "input": 0.2, - "output": 0.2 + "supported": false }, "type": "chat" }, { - "id": "coding-minimax-m2-free", - "name": "coding-minimax-m2-free", - "display_name": "coding-minimax-m2-free", - "modalities": { - "input": [ - "text" - ] - }, + "id": "z-ai/glm-4-32b", + "name": "z-ai/glm-4-32b", + "display_name": "z-ai/glm-4-32b", "limit": { - "context": 204800, - "output": 204800 + "context": 4096, + "output": 4096 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "cost": { - "input": 0, - "output": 0, - "cache_read": 0 + "supported": false }, "type": "chat" }, { - "id": "o3-pro", - "name": "o3-pro", - "display_name": "o3-pro", - "modalities": { - "input": [ - "text", - "image" - ] - }, + "id": "z-ai/glm-4.5", + "name": "z-ai/glm-4.5", + "display_name": "z-ai/glm-4.5", "limit": { - "context": 200000, - "output": 200000 + "context": 4096, + "output": 4096 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "cost": { - "input": 20, - "output": 80, - "cache_read": 20 + "supported": false }, "type": "chat" }, { - "id": "wan2.2-i2v-plus", - "name": "wan2.2-i2v-plus", - "display_name": "wan2.2-i2v-plus", - "modalities": { - "input": [ - "text", - "image" - ] - }, + "id": "z-ai/glm-4.5-air", + "name": "z-ai/glm-4.5-air", + "display_name": "z-ai/glm-4.5-air", "limit": { - "context": 8192, - "output": 8192 + "context": 4096, + "output": 4096 }, "tool_call": false, "reasoning": { "supported": false }, - "cost": { - "input": 2, - "output": 0 - }, "type": "chat" }, { - "id": "wan2.2-t2v-plus", - "name": "wan2.2-t2v-plus", - "display_name": "wan2.2-t2v-plus", - "modalities": { - "input": [ - "text" - ] - }, + "id": "z-ai/glm-4.5v", + "name": "z-ai/glm-4.5v", + "display_name": "z-ai/glm-4.5v", "limit": { - "context": 8192, - "output": 8192 + "context": 4096, + "output": 4096 }, "tool_call": false, "reasoning": { "supported": false }, - "cost": { - "input": 2, - "output": 0 - }, "type": "chat" }, { - "id": "wan2.5-i2v-preview", - "name": "wan2.5-i2v-preview", - "display_name": "wan2.5-i2v-preview", - "modalities": { - "input": [ - "text", - "image" - ] - }, + "id": "z-ai/glm-4.6", + "name": "z-ai/glm-4.6", + "display_name": "z-ai/glm-4.6", "limit": { - "context": 8192, - "output": 8192 + "context": 4096, + "output": 4096 }, "tool_call": false, "reasoning": { "supported": false }, - "cost": { - "input": 2, - "output": 0 - }, "type": "chat" }, { - "id": "wan2.5-t2v-preview", - "name": "wan2.5-t2v-preview", - "display_name": "wan2.5-t2v-preview", - "modalities": { - "input": [ - "text" - ] - }, + "id": "z-ai/glm-4.6v", + "name": "z-ai/glm-4.6v", + "display_name": "z-ai/glm-4.6v", "limit": { - "context": 8192, - "output": 8192 + "context": 4096, + "output": 4096 }, "tool_call": false, "reasoning": { "supported": false }, - "cost": { - "input": 2, - "output": 0 - }, "type": "chat" }, { - "id": "web-sora-2", - "name": "web-sora-2", - "display_name": "web-sora-2", + "id": "z-ai/glm-4.7", + "name": "z-ai/glm-4.7", + "display_name": "z-ai/glm-4.7", "limit": { - "context": 8192, - "output": 8192 + "context": 4096, + "output": 4096 }, "tool_call": false, "reasoning": { "supported": false }, - "cost": { - "input": 2, - "output": 2 - }, "type": "chat" }, { - "id": "web-sora-2-pro", - "name": "web-sora-2-pro", - "display_name": "web-sora-2-pro", + "id": "z-ai/glm-4.7-flash", + "name": "z-ai/glm-4.7-flash", + "display_name": "z-ai/glm-4.7-flash", "limit": { - "context": 8192, - "output": 8192 + "context": 4096, + "output": 4096 }, "tool_call": false, "reasoning": { "supported": false }, - "cost": { - "input": 2, - "output": 2 - }, "type": "chat" - }, + } + ] + }, + "aihubmix": { + "id": "aihubmix", + "name": "AIHubMix", + "display_name": "AIHubMix", + "models": [ { - "id": "flux-2-flex", - "name": "flux-2-flex", - "display_name": "flux-2-flex", + "id": "claude-opus-4-6", + "name": "claude-opus-4-6", + "display_name": "claude-opus-4-6", "modalities": { "input": [ "text", @@ -73666,56 +84564,56 @@ ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 200000, + "output": 200000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "cost": { - "input": 2, - "output": 0, - "cache_read": 0 + "input": 5, + "output": 25, + "cache_read": 0.5 }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "flux-2-pro", - "name": "flux-2-pro", - "display_name": "flux-2-pro", + "id": "claude-opus-4-6-think", + "name": "claude-opus-4-6-think", + "display_name": "claude-opus-4-6-think", "modalities": { "input": [ - "text", - "image" + "image", + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 200000, + "output": 200000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "cost": { - "input": 2, - "output": 0, - "cache_read": 0 + "input": 5, + "output": 25, + "cache_read": 0.5 }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "gemini-2.5-pro", - "name": "gemini-2.5-pro", - "display_name": "gemini-2.5-pro", + "id": "gemini-3-flash-preview", + "name": "gemini-3-flash-preview", + "display_name": "gemini-3-flash-preview", "modalities": { "input": [ "text", "image", - "audio", - "video", - "pdf" + "audio" ] }, "limit": { @@ -73728,30 +84626,57 @@ "default": true }, "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 0.5, + "output": 3, + "cache_read": 0.05 }, "type": "chat" }, { - "id": "glm-4.6", - "name": "glm-4.6", - "display_name": "glm-4.6", + "id": "gemini-3-flash-preview-search", + "name": "gemini-3-flash-preview-search", + "display_name": "gemini-3-flash-preview-search", "modalities": { "input": [ - "text" + "text", + "image", + "audio" ] }, "limit": { - "context": 204800, - "output": 204800 + "context": 1048576, + "output": 1048576 }, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "cost": { + "input": 0.5, + "output": 3, + "cache_read": 0.05 + }, + "type": "chat" + }, + { + "id": "step-3.5-flash-free", + "name": "step-3.5-flash-free", + "display_name": "step-3.5-flash-free", + "modalities": { + "input": [ + "text", + "image" + ] + }, + "limit": { + "context": 256000, + "output": 256000 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, "cost": { "input": 0, "output": 0, @@ -73760,120 +84685,129 @@ "type": "chat" }, { - "id": "glm-4.6v", - "name": "glm-4.6v", - "display_name": "glm-4.6v", + "id": "claude-opus-4-5", + "name": "claude-opus-4-5", + "display_name": "claude-opus-4-5", "modalities": { "input": [ "text", - "image", - "video" + "image" ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 200000, + "output": 200000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "cost": { - "input": 0.137, - "output": 0.411, - "cache_read": 0.0274 + "input": 5, + "output": 25, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "jimeng-3.0-1080p", - "name": "jimeng-3.0-1080p", - "display_name": "jimeng-3.0-1080p", + "id": "claude-opus-4-5-think", + "name": "claude-opus-4-5-think", + "display_name": "claude-opus-4-5-think", "modalities": { "input": [ - "text", - "image" + "image", + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 200000, + "output": 200000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "cost": { - "input": 2, - "output": 0 + "input": 5, + "output": 25, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "jimeng-3.0-720p", - "name": "jimeng-3.0-720p", - "display_name": "jimeng-3.0-720p", + "id": "gemini-3-flash-preview-free", + "name": "gemini-3-flash-preview-free", + "display_name": "gemini-3-flash-preview-free", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 1048576, + "output": 1048576 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "cost": { - "input": 2, - "output": 0 + "input": 0, + "output": 0, + "cache_read": 0 }, "type": "chat" }, { - "id": "jimeng-3.0-pro", - "name": "jimeng-3.0-pro", - "display_name": "jimeng-3.0-pro", + "id": "glm-4.7", + "name": "glm-4.7", + "display_name": "glm-4.7", "modalities": { "input": [ - "text", - "image" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 200000, + "output": 200000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "cost": { - "input": 2, - "output": 0 + "input": 0.273974, + "output": 1.095896, + "cache_read": 0.054795 }, "type": "chat" }, { - "id": "kimi-for-coding-free", - "name": "kimi-for-coding-free", - "display_name": "kimi-for-coding-free", + "id": "gemini-2.0-flash-free", + "name": "gemini-2.0-flash-free", + "display_name": "gemini-2.0-flash-free", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video" ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 1048576, + "output": 1048576 }, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "cost": { "input": 0, @@ -73883,21 +84817,17 @@ "type": "chat" }, { - "id": "gemini-2.5-pro-search", - "name": "gemini-2.5-pro-search", - "display_name": "gemini-2.5-pro-search", + "id": "glm-4.7-flash-free", + "name": "glm-4.7-flash-free", + "display_name": "glm-4.7-flash-free", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ] }, "limit": { - "context": 1048576, - "output": 1048576 + "context": 8192, + "output": 8192 }, "tool_call": true, "reasoning": { @@ -73905,24 +84835,24 @@ "default": true }, "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 0, + "output": 0, + "cache_read": 0 }, "type": "chat" }, { - "id": "kimi-k2-thinking", - "name": "kimi-k2-thinking", - "display_name": "kimi-k2-thinking", + "id": "coding-glm-4.7-free", + "name": "coding-glm-4.7-free", + "display_name": "coding-glm-4.7-free", "modalities": { "input": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 8192, + "output": 8192 }, "tool_call": true, "reasoning": { @@ -73930,62 +84860,67 @@ "default": true }, "cost": { - "input": 0.548, - "output": 2.192, - "cache_read": 0.137 + "input": 0, + "output": 0, + "cache_read": 0 }, "type": "chat" }, { - "id": "Kimi-K2-0905", - "name": "Kimi-K2-0905", - "display_name": "Kimi-K2-0905", + "id": "gemini-3-pro-image-preview", + "name": "gemini-3-pro-image-preview", + "display_name": "gemini-3-pro-image-preview", "modalities": { "input": [ - "text" + "text", + "image" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 8192, + "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "cost": { - "input": 0.548, - "output": 2.192 + "input": 2, + "output": 12, + "cache_read": 2 }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "DeepSeek-V3.1-Fast", - "name": "DeepSeek-V3.1-Fast", - "display_name": "DeepSeek-V3.1-Fast", + "id": "gpt-5.2-codex", + "name": "gpt-5.2-codex", + "display_name": "gpt-5.2-codex", "modalities": { "input": [ - "text" + "text", + "image" ] }, "limit": { - "context": 163000, - "output": 163000 + "context": 400000, + "output": 400000 }, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "cost": { - "input": 1.096, - "output": 3.288 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "claude-opus-4-0", - "name": "claude-opus-4-0", - "display_name": "claude-opus-4-0", + "id": "gpt-image-1.5", + "name": "gpt-image-1.5", + "display_name": "gpt-image-1.5", "modalities": { "input": [ "text", @@ -73993,23 +84928,24 @@ ] }, "limit": { - "context": 200000, - "output": 200000 + "context": 8192, + "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "cost": { - "input": 16.5, - "output": 82.5 + "input": 5, + "output": 10, + "cache_read": 5 }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "claude-sonnet-4-0", - "name": "claude-sonnet-4-0", - "display_name": "claude-sonnet-4-0", + "id": "gpt-5.2", + "name": "gpt-5.2", + "display_name": "gpt-5.2", "modalities": { "input": [ "text", @@ -74017,8 +84953,8 @@ ] }, "limit": { - "context": 1000000, - "output": 1000000 + "context": 400000, + "output": 400000 }, "tool_call": true, "reasoning": { @@ -74026,96 +84962,93 @@ "default": true }, "cost": { - "input": 3.3, - "output": 16.5, - "cache_read": 0.33 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "gemini-2.5-flash", - "name": "gemini-2.5-flash", - "display_name": "gemini-2.5-flash", + "id": "gpt-5.2-chat-latest", + "name": "gpt-5.2-chat-latest", + "display_name": "gpt-5.2-chat-latest", "modalities": { "input": [ "text", - "image", - "audio", - "video" + "image" ] }, "limit": { - "context": 1048576, - "output": 1048576 + "context": 128000, + "output": 128000 }, "tool_call": true, "reasoning": { "supported": false }, "cost": { - "input": 0.3, - "output": 2.499, - "cache_read": 0.03 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "gemini-2.5-flash-preview-09-2025", - "name": "gemini-2.5-flash-preview-09-2025", - "display_name": "gemini-2.5-flash-preview-09-2025", + "id": "gpt-5.2-high", + "name": "gpt-5.2-high", + "display_name": "gpt-5.2-high", "modalities": { "input": [ "text", - "image", - "audio", - "video" + "image" ] }, "limit": { - "context": 1048576, - "output": 1048576 + "context": 400000, + "output": 400000 }, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "cost": { - "input": 0.3, - "output": 2.499, - "cache_read": 0.03 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "glm-4.5v", - "name": "glm-4.5v", - "display_name": "glm-4.5v", + "id": "gpt-5.2-low", + "name": "gpt-5.2-low", + "display_name": "gpt-5.2-low", "modalities": { "input": [ "text", - "image", - "video" + "image" ] }, "limit": { - "context": 64000, - "output": 64000 + "context": 400000, + "output": 400000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "cost": { - "input": 0.274, - "output": 0.822, - "cache_read": 0.274 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "gemini-2.5-flash-lite", - "name": "gemini-2.5-flash-lite", - "display_name": "gemini-2.5-flash-lite", + "id": "gemini-3-pro-preview", + "name": "gemini-3-pro-preview", + "display_name": "gemini-3-pro-preview", "modalities": { "input": [ "text", @@ -74125,105 +85058,103 @@ ] }, "limit": { - "context": 1048576, - "output": 1048576 + "context": 8192, + "output": 8192 }, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.01 + "input": 2, + "output": 12, + "cache_read": 0.2 }, "type": "chat" }, { - "id": "gemini-2.5-flash-lite-preview-09-2025", - "name": "gemini-2.5-flash-lite-preview-09-2025", - "display_name": "gemini-2.5-flash-lite-preview-09-2025", + "id": "gpt-5.2-pro", + "name": "gpt-5.2-pro", + "display_name": "gpt-5.2-pro", "modalities": { "input": [ "text", - "image", - "audio", - "video" + "image" ] }, "limit": { - "context": 1048576, - "output": 1048576 + "context": 400000, + "output": 400000 }, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.01 + "input": 21, + "output": 168, + "cache_read": 2.1 }, "type": "chat" }, { - "id": "gemini-2.5-flash-nothink", - "name": "gemini-2.5-flash-nothink", - "display_name": "gemini-2.5-flash-nothink", + "id": "gpt-5.1", + "name": "gpt-5.1", + "display_name": "gpt-5.1", "modalities": { "input": [ "text", - "image", - "audio", - "video" + "image" ] }, "limit": { - "context": 1047576, - "output": 1047576 + "context": 400000, + "output": 400000 }, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "cost": { - "input": 0.3, - "output": 2.499, - "cache_read": 0.03 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "gemini-2.5-flash-search", - "name": "gemini-2.5-flash-search", - "display_name": "gemini-2.5-flash-search", + "id": "gpt-5.1-codex-max", + "name": "gpt-5.1-codex-max", + "display_name": "gpt-5.1-codex-max", "modalities": { "input": [ "text", - "image", - "audio", - "video" + "image" ] }, "limit": { - "context": 1048576, - "output": 1048576 + "context": 400000, + "output": 400000 }, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "cost": { - "input": 0.3, - "output": 2.499, - "cache_read": 0.03 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "gemini-2.5-flash-preview-05-20-nothink", - "name": "gemini-2.5-flash-preview-05-20-nothink", - "display_name": "gemini-2.5-flash-preview-05-20-nothink", + "id": "gemini-3-pro-preview-search", + "name": "gemini-3-pro-preview-search", + "display_name": "gemini-3-pro-preview-search", "modalities": { "input": [ "text", @@ -74233,116 +85164,129 @@ ] }, "limit": { - "context": 1048576, - "output": 1048576 + "context": 8192, + "output": 8192 }, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "cost": { - "input": 0.3, - "output": 2.499, - "cache_read": 0.03 + "input": 2, + "output": 12, + "cache_read": 0.2 }, "type": "chat" }, { - "id": "gemini-2.5-flash-preview-05-20-search", - "name": "gemini-2.5-flash-preview-05-20-search", - "display_name": "gemini-2.5-flash-preview-05-20-search", + "id": "gpt-5.1-chat-latest", + "name": "gpt-5.1-chat-latest", + "display_name": "gpt-5.1-chat-latest", "modalities": { "input": [ "text", - "image", - "audio", - "video" + "image" ] }, "limit": { - "context": 1048576, - "output": 1048576 + "context": 128000, + "output": 128000 }, "tool_call": true, "reasoning": { "supported": false }, "cost": { - "input": 0.3, - "output": 2.499, - "cache_read": 0.03 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "DeepSeek-V3-Fast", - "name": "DeepSeek-V3-Fast", - "display_name": "DeepSeek-V3-Fast", + "id": "gpt-5.1-codex", + "name": "gpt-5.1-codex", + "display_name": "gpt-5.1-codex", "modalities": { "input": [ - "text" + "text", + "image" ] }, "limit": { - "context": 32000, - "output": 32000 + "context": 400000, + "output": 400000 }, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "cost": { - "input": 0.56, - "output": 2.24 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "veo-2.0-generate-001", - "name": "veo-2.0-generate-001", - "display_name": "veo-2.0-generate-001", + "id": "gpt-5.1-codex-mini", + "name": "gpt-5.1-codex-mini", + "display_name": "gpt-5.1-codex-mini", "modalities": { "input": [ - "video" + "text", + "image" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 400000, + "output": 400000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "cost": { - "input": 2, + "input": 0.25, "output": 2, - "cache_read": 0 + "cache_read": 0.025 }, "type": "chat" }, { - "id": "veo3.1", - "name": "veo3.1", - "display_name": "veo3.1", + "id": "doubao-seed-1-8", + "name": "doubao-seed-1-8", + "display_name": "doubao-seed-1-8", + "modalities": { + "input": [ + "text", + "image", + "video" + ] + }, "limit": { - "context": 8192, - "output": 8192 + "context": 256000, + "output": 256000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "cost": { - "input": 200, - "output": 200 + "input": 0.10959, + "output": 0.273975, + "cache_read": 0.021918 }, "type": "chat" }, { - "id": "imagen-4.0", - "name": "imagen-4.0", - "display_name": "imagen-4.0", + "id": "claude-haiku-4-5", + "name": "claude-haiku-4-5", + "display_name": "claude-haiku-4-5", "modalities": { "input": [ "text", @@ -74350,24 +85294,25 @@ ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 204800, + "output": 204800 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "cost": { - "input": 2, - "output": 2, - "cache_read": 0 + "input": 1.1, + "output": 5.5, + "cache_read": 0.11 }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "imagen-4.0-fast-generate-001", - "name": "imagen-4.0-fast-generate-001", - "display_name": "imagen-4.0-fast-generate-001", + "id": "claude-sonnet-4-5", + "name": "claude-sonnet-4-5", + "display_name": "claude-sonnet-4-5", "modalities": { "input": [ "text", @@ -74375,23 +85320,25 @@ ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 1000000, + "output": 1000000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "cost": { - "input": 2, - "output": 2 + "input": 3.3, + "output": 16.5, + "cache_read": 0.33 }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "imagen-4.0-fast-generate-preview-06-06", - "name": "imagen-4.0-fast-generate-preview-06-06", - "display_name": "imagen-4.0-fast-generate-preview-06-06", + "id": "claude-sonnet-4-5-think", + "name": "claude-sonnet-4-5-think", + "display_name": "claude-sonnet-4-5-think", "modalities": { "input": [ "text", @@ -74399,23 +85346,25 @@ ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 1000000, + "output": 1000000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "cost": { - "input": 2, - "output": 2 + "input": 3.3, + "output": 16.5, + "cache_read": 0.33 }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "imagen-4.0-generate-001", - "name": "imagen-4.0-generate-001", - "display_name": "imagen-4.0-generate-001", + "id": "mistral-large-3", + "name": "mistral-large-3", + "display_name": "mistral-large-3", "modalities": { "input": [ "text", @@ -74423,23 +85372,23 @@ ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 256000, + "output": 256000 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "cost": { - "input": 2, - "output": 2 + "input": 0.5, + "output": 1.5 }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "imagen-4.0-ultra-generate-001", - "name": "imagen-4.0-ultra-generate-001", - "display_name": "imagen-4.0-ultra-generate-001", + "id": "web-gpt-image-1.5", + "name": "web-gpt-image-1.5", + "display_name": "web-gpt-image-1.5", "modalities": { "input": [ "text", @@ -74455,40 +85404,41 @@ "supported": false }, "cost": { - "input": 2, - "output": 2 + "input": 3, + "output": 3, + "cache_read": 0 }, "type": "imageGeneration" }, { - "id": "imagen-4.0-ultra", - "name": "imagen-4.0-ultra", - "display_name": "imagen-4.0-ultra", + "id": "gemini-2.5-flash-image", + "name": "gemini-2.5-flash-image", + "display_name": "gemini-2.5-flash-image", "modalities": { "input": [ - "text", - "image" + "image", + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 32800, + "output": 32800 }, "tool_call": false, "reasoning": { "supported": false }, "cost": { - "input": 2, - "output": 2, - "cache_read": 0 + "input": 0.3, + "output": 2.499, + "cache_read": 0.3 }, "type": "imageGeneration" }, { - "id": "gpt-image-1", - "name": "gpt-image-1", - "display_name": "gpt-image-1", + "id": "grok-4-1-fast-non-reasoning", + "name": "grok-4-1-fast-non-reasoning", + "display_name": "grok-4-1-fast-non-reasoning", "modalities": { "input": [ "text", @@ -74496,24 +85446,24 @@ ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 2000000, + "output": 2000000 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "cost": { - "input": 5, - "output": 40, - "cache_read": 5 + "input": 0.2, + "output": 0.5, + "cache_read": 0.05 }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "gpt-image-1-mini", - "name": "gpt-image-1-mini", - "display_name": "gpt-image-1-mini", + "id": "grok-4-1-fast-reasoning", + "name": "grok-4-1-fast-reasoning", + "display_name": "grok-4-1-fast-reasoning", "modalities": { "input": [ "text", @@ -74521,24 +85471,25 @@ ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 2000000, + "output": 2000000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "cost": { - "input": 5, - "output": 40, - "cache_read": 5 + "input": 0.2, + "output": 0.5, + "cache_read": 0.05 }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "o4-mini", - "name": "o4-mini", - "display_name": "o4-mini", + "id": "grok-code-fast-1", + "name": "grok-code-fast-1", + "display_name": "grok-code-fast-1", "modalities": { "input": [ "text", @@ -74546,8 +85497,8 @@ ] }, "limit": { - "context": 200000, - "output": 200000 + "context": 256000, + "output": 256000 }, "tool_call": true, "reasoning": { @@ -74555,16 +85506,21 @@ "default": true }, "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.275 + "input": 0.2, + "output": 0.5, + "cache_read": 0.05 }, "type": "chat" }, { - "id": "paddleocr-vl-0.9b", - "name": "paddleocr-vl-0.9b", - "display_name": "paddleocr-vl-0.9b", + "id": "mimo-v2-flash", + "name": "mimo-v2-flash", + "display_name": "mimo-v2-flash", + "modalities": { + "input": [ + "text" + ] + }, "limit": { "context": 8192, "output": 8192 @@ -74574,114 +85530,117 @@ "supported": false }, "cost": { - "input": 2, - "output": 0 + "input": 0.1918, + "output": 0.5754, + "cache_read": 0.03836 }, "type": "chat" }, { - "id": "pp-structurev3", - "name": "pp-structurev3", - "display_name": "pp-structurev3", + "id": "gpt-5", + "name": "gpt-5", + "display_name": "gpt-5", + "modalities": { + "input": [ + "text", + "image" + ] + }, "limit": { - "context": 8192, - "output": 8192 + "context": 400000, + "output": 400000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "cost": { - "input": 2, - "output": 0 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "qwen3-vl-235b-a22b-instruct", - "name": "qwen3-vl-235b-a22b-instruct", - "display_name": "qwen3-vl-235b-a22b-instruct", + "id": "deepseek-v3.2-fast", + "name": "deepseek-v3.2-fast", + "display_name": "deepseek-v3.2-fast", "modalities": { "input": [ - "text", - "image", - "video" + "text" ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 128000, + "output": 128000 }, "tool_call": true, "reasoning": { "supported": false }, "cost": { - "input": 0.274, - "output": 1.096 + "input": 1.096, + "output": 3.288, + "cache_read": 1.096 }, "type": "chat" }, { - "id": "qwen3-vl-235b-a22b-thinking", - "name": "qwen3-vl-235b-a22b-thinking", - "display_name": "qwen3-vl-235b-a22b-thinking", + "id": "deepseek-v3.2", + "name": "deepseek-v3.2", + "display_name": "deepseek-v3.2", "modalities": { "input": [ - "text", - "image", - "video" + "text" ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 128000, + "output": 128000 }, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "cost": { - "input": 0.274, - "output": 2.74 + "input": 0.302, + "output": 0.453, + "cache_read": 0.0302 }, "type": "chat" }, { - "id": "qwen3-vl-30b-a3b-instruct", - "name": "qwen3-vl-30b-a3b-instruct", - "display_name": "qwen3-vl-30b-a3b-instruct", + "id": "deepseek-v3.2-speciale", + "name": "deepseek-v3.2-speciale", + "display_name": "deepseek-v3.2-speciale", "modalities": { "input": [ - "text", - "image", - "video" + "text" ] }, "limit": { "context": 128000, "output": 128000 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "cost": { - "input": 0.1028, - "output": 0.4112 + "input": 0.58, + "output": 1.680028 }, "type": "chat" }, { - "id": "qwen3-vl-30b-a3b-thinking", - "name": "qwen3-vl-30b-a3b-thinking", - "display_name": "qwen3-vl-30b-a3b-thinking", + "id": "deepseek-v3.2-think", + "name": "deepseek-v3.2-think", + "display_name": "deepseek-v3.2-think", "modalities": { "input": [ - "text", - "image", - "video" + "text" ] }, "limit": { @@ -74690,163 +85649,166 @@ }, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "cost": { - "input": 0.1028, - "output": 1.028 + "input": 0.302, + "output": 0.453, + "cache_read": 0.0302 }, "type": "chat" }, { - "id": "veo-3.0-generate-preview", - "name": "veo-3.0-generate-preview", - "display_name": "veo-3.0-generate-preview", + "id": "deepseek-math-v2", + "name": "deepseek-math-v2", + "display_name": "deepseek-math-v2", "modalities": { "input": [ - "text", - "image", - "video" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 163000, + "output": 163000 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "cost": { - "input": 2, - "output": 2, - "cache_read": 0 + "input": 0.492, + "output": 1.968, + "cache_read": 0.0984 }, "type": "chat" }, { - "id": "veo-3.1-fast-generate-preview", - "name": "veo-3.1-fast-generate-preview", - "display_name": "veo-3.1-fast-generate-preview", + "id": "DeepSeek-V3.2-Exp", + "name": "DeepSeek-V3.2-Exp", + "display_name": "DeepSeek-V3.2-Exp", "modalities": { "input": [ - "text", - "image", - "video" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 163000, + "output": 163000 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "cost": { - "input": 2, - "output": 0 + "input": 0.274, + "output": 0.411, + "cache_read": 0.0274 }, "type": "chat" }, { - "id": "veo-3.1-generate-preview", - "name": "veo-3.1-generate-preview", - "display_name": "veo-3.1-generate-preview", + "id": "DeepSeek-V3.2-Exp-Think", + "name": "DeepSeek-V3.2-Exp-Think", + "display_name": "DeepSeek-V3.2-Exp-Think", "modalities": { "input": [ - "text", - "image", - "video" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 131000, + "output": 131000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "cost": { - "input": 2, - "output": 2, - "cache_read": 0 + "input": 0.274, + "output": 0.411, + "cache_read": 0.0274 }, "type": "chat" }, { - "id": "flux-kontext-max", - "name": "flux-kontext-max", - "display_name": "flux-kontext-max", + "id": "gpt-5-codex", + "name": "gpt-5-codex", + "display_name": "gpt-5-codex", + "modalities": { + "input": [ + "text", + "image" + ] + }, "limit": { - "context": 8192, - "output": 8192 + "context": 400000, + "output": 400000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "cost": { - "input": 2, - "output": 0, - "cache_read": 0 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "gemini-2.5-flash-image-preview", - "name": "gemini-2.5-flash-image-preview", - "display_name": "gemini-2.5-flash-image-preview", + "id": "DeepSeek-V3.1-Terminus", + "name": "DeepSeek-V3.1-Terminus", + "display_name": "DeepSeek-V3.1-Terminus", "modalities": { "input": [ - "image", "text" ] }, "limit": { - "context": 32800, - "output": 32800 + "context": 160000, + "output": 160000 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.3 + "input": 0.56, + "output": 1.68 }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "glm-4.5", - "name": "glm-4.5", - "display_name": "glm-4.5", + "id": "DeepSeek-V3.1-Think", + "name": "DeepSeek-V3.1-Think", + "display_name": "DeepSeek-V3.1-Think", "modalities": { "input": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 128000, + "output": 128000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "cost": { - "input": 0.4, - "output": 1.6 + "input": 0.56, + "output": 1.68 }, "type": "chat" }, { - "id": "gpt-4.1", - "name": "gpt-4.1", - "display_name": "gpt-4.1", + "id": "gpt-5-pro", + "name": "gpt-5-pro", + "display_name": "gpt-5-pro", "modalities": { "input": [ "text", @@ -74854,194 +85816,242 @@ ] }, "limit": { - "context": 1047576, - "output": 1047576 + "context": 400000, + "output": 400000 }, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "cost": { - "input": 2, - "output": 8, - "cache_read": 0.5 + "input": 15, + "output": 120 }, "type": "chat" }, { - "id": "grok-4", - "name": "grok-4", - "display_name": "grok-4", + "id": "gpt-5-mini", + "name": "gpt-5-mini", + "display_name": "gpt-5-mini", + "modalities": { + "input": [ + "text", + "image" + ] + }, "limit": { - "context": 256000, - "output": 256000 + "context": 400000, + "output": 400000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "cost": { - "input": 3.3, - "output": 16.5, - "cache_read": 0.825 + "input": 0.25, + "output": 2, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "grok-4-fast-non-reasoning", - "name": "grok-4-fast-non-reasoning", - "display_name": "grok-4-fast-non-reasoning", + "id": "gpt-5-nano", + "name": "gpt-5-nano", + "display_name": "gpt-5-nano", + "modalities": { + "input": [ + "text", + "image" + ] + }, "limit": { - "context": 2000000, - "output": 2000000 + "context": 400000, + "output": 400000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 + "input": 0.05, + "output": 0.4, + "cache_read": 0.005 }, "type": "chat" }, { - "id": "grok-4-fast-reasoning", - "name": "grok-4-fast-reasoning", - "display_name": "grok-4-fast-reasoning", + "id": "gpt-5-chat-latest", + "name": "gpt-5-chat-latest", + "display_name": "gpt-5-chat-latest", + "modalities": { + "input": [ + "text", + "image" + ] + }, "limit": { - "context": 2000000, - "output": 2000000 + "context": 400000, + "output": 400000 }, "tool_call": false, "reasoning": { "supported": false }, "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "kimi-k2-0711", - "name": "kimi-k2-0711", - "display_name": "kimi-k2-0711", + "id": "claude-opus-4-1", + "name": "claude-opus-4-1", + "display_name": "claude-opus-4-1", "modalities": { "input": [ - "text" + "text", + "image" ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 200000, + "output": 200000 }, "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "cost": { + "input": 16.5, + "output": 82.5 + }, + "type": "chat" + }, + { + "id": "o3-deep-research", + "name": "o3-deep-research", + "display_name": "o3-deep-research", + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": false, "reasoning": { "supported": false }, "cost": { - "input": 0.54, - "output": 2.16 + "input": 10, + "output": 40, + "cache_read": 2.5 }, "type": "chat" }, { - "id": "kimi-k2-turbo-preview", - "name": "kimi-k2-turbo-preview", - "display_name": "kimi-k2-turbo-preview", + "id": "qwen3-max-2026-01-23", + "name": "qwen3-max-2026-01-23", + "display_name": "qwen3-max-2026-01-23", "modalities": { "input": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 252000, + "output": 252000 }, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "cost": { - "input": 1.2, - "output": 4.8, - "cache_read": 0.3 + "input": 0.34246, + "output": 1.36984, + "cache_read": 0.34246 }, "type": "chat" }, - { - "id": "DeepSeek-OCR", - "name": "DeepSeek-OCR", - "display_name": "DeepSeek-OCR", + { + "id": "kimi-k2.5", + "name": "kimi-k2.5", + "display_name": "kimi-k2.5", "modalities": { "input": [ "text", - "image" + "image", + "video" ] }, "limit": { - "context": 8000, - "output": 8000 + "context": 256000, + "output": 256000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "cost": { - "input": 0.02, - "output": 0.02 + "input": 0.6, + "output": 3, + "cache_read": 0.105 }, "type": "chat" }, { - "id": "deepseek-ocr", - "name": "deepseek-ocr", - "display_name": "deepseek-ocr", + "id": "qwen3-vl-flash", + "name": "qwen3-vl-flash", + "display_name": "qwen3-vl-flash", "modalities": { "input": [ "text", - "image" + "image", + "video" ] }, "limit": { - "context": 8000, - "output": 8000 + "context": 254000, + "output": 254000 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "cost": { - "input": 0.02, - "output": 0.02 + "input": 0.0206, + "output": 0.206, + "cache_read": 0.00412 }, "type": "chat" }, { - "id": "aihubmix-router", - "name": "aihubmix-router", - "display_name": "aihubmix-router", + "id": "qwen3-vl-flash-2026-01-22", + "name": "qwen3-vl-flash-2026-01-22", + "display_name": "qwen3-vl-flash-2026-01-22", "modalities": { "input": [ "text", - "image" + "image", + "video" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 254000, + "output": 254000 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "cost": { - "input": 0.4, - "output": 1.6, - "cache_read": 0.1 + "input": 0.0206, + "output": 0.206, + "cache_read": 0.0206 }, "type": "chat" }, @@ -75072,147 +86082,114 @@ "type": "chat" }, { - "id": "gpt-4.1-mini", - "name": "gpt-4.1-mini", - "display_name": "gpt-4.1-mini", - "modalities": { - "input": [ - "text", - "image" - ] - }, + "id": "sora-2", + "name": "sora-2", + "display_name": "sora-2", "limit": { - "context": 1047576, - "output": 1047576 + "context": 8192, + "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "cost": { - "input": 0.4, - "output": 1.6, - "cache_read": 0.1 + "input": 2, + "output": 2 }, "type": "chat" }, { - "id": "gpt-4.1-nano", - "name": "gpt-4.1-nano", - "display_name": "gpt-4.1-nano", - "modalities": { - "input": [ - "text", - "image" - ] - }, + "id": "sora-2-pro", + "name": "sora-2-pro", + "display_name": "sora-2-pro", "limit": { - "context": 1047576, - "output": 1047576 + "context": 8192, + "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.025 + "input": 2, + "output": 2 }, "type": "chat" }, { - "id": "gemini-2.5-pro-preview-05-06", - "name": "gemini-2.5-pro-preview-05-06", - "display_name": "gemini-2.5-pro-preview-05-06", + "id": "doubao-seedream-4-5", + "name": "doubao-seedream-4-5", + "display_name": "doubao-seedream-4-5", "modalities": { "input": [ "text", - "image", - "audio", - "video" + "image" ] }, "limit": { - "context": 1048576, - "output": 1048576 + "context": 8192, + "output": 8192 }, "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 2, + "output": 0, + "cache_read": 0 }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "gemini-2.5-pro-preview-03-25", - "name": "gemini-2.5-pro-preview-03-25", - "display_name": "gemini-2.5-pro-preview-03-25", - "modalities": { - "input": [ - "text", - "image" - ] - }, + "id": "cc-glm-4.7", + "name": "cc-glm-4.7", + "display_name": "cc-glm-4.7", "limit": { "context": 8192, "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 0.06, + "output": 0.22 }, "type": "chat" }, { - "id": "gemini-2.5-pro-preview-05-06-search", - "name": "gemini-2.5-pro-preview-05-06-search", - "display_name": "gemini-2.5-pro-preview-05-06-search", + "id": "cc-minimax-m2.1", + "name": "cc-minimax-m2.1", + "display_name": "cc-minimax-m2.1", "modalities": { "input": [ - "text", - "image", - "audio", - "video" + "text" ] }, "limit": { "context": 8192, "output": 8192 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 0.1, + "output": 0.1 }, "type": "chat" }, { - "id": "gemini-2.5-pro-preview-03-25-search", - "name": "gemini-2.5-pro-preview-03-25-search", - "display_name": "gemini-2.5-pro-preview-03-25-search", + "id": "coding-glm-4.7", + "name": "coding-glm-4.7", + "display_name": "coding-glm-4.7", "modalities": { "input": [ - "text", - "image", - "audio", - "video" + "text" ] }, "limit": { @@ -75225,139 +86202,124 @@ "default": true }, "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 0.06, + "output": 0.22, + "cache_read": 0.010998 }, "type": "chat" }, { - "id": "qwen3-max-preview", - "name": "qwen3-max-preview", - "display_name": "qwen3-max-preview", + "id": "coding-minimax-m2.1", + "name": "coding-minimax-m2.1", + "display_name": "coding-minimax-m2.1", "modalities": { "input": [ - "text", - "image" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 204800, + "output": 204800 }, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "cost": { - "input": 0.822, - "output": 3.288, - "cache_read": 0.822 + "input": 0.2, + "output": 0.2 }, "type": "chat" }, { - "id": "qwen3-max", - "name": "qwen3-max", - "display_name": "qwen3-max", - "modalities": { - "input": [ - "text", - "image" - ] - }, + "id": "coding-minimax-m2.1-free", + "name": "coding-minimax-m2.1-free", + "display_name": "coding-minimax-m2.1-free", "limit": { - "context": 262144, - "output": 262144 + "context": 204800, + "output": 204800 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "cost": { - "input": 0.822, - "output": 3.288, - "cache_read": 0.822 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "qwen3-next-80b-a3b-instruct", - "name": "qwen3-next-80b-a3b-instruct", - "display_name": "qwen3-next-80b-a3b-instruct", + "id": "gpt-4o-audio-preview", + "name": "gpt-4o-audio-preview", + "display_name": "gpt-4o-audio-preview", "modalities": { "input": [ "text", - "image" + "audio" ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 128000, + "output": 128000 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "cost": { - "input": 0.138, - "output": 0.552 + "input": 2.5, + "output": 10 }, "type": "chat" }, { - "id": "qwen3-next-80b-a3b-thinking", - "name": "qwen3-next-80b-a3b-thinking", - "display_name": "qwen3-next-80b-a3b-thinking", + "id": "gpt-4o-mini-audio-preview", + "name": "gpt-4o-mini-audio-preview", + "display_name": "gpt-4o-mini-audio-preview", "modalities": { "input": [ "text", - "image" + "audio" ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 8192, + "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "cost": { - "input": 0.138, - "output": 1.38 + "input": 0.15, + "output": 0.6 }, "type": "chat" }, { - "id": "qwen3-235b-a22b-instruct-2507", - "name": "qwen3-235b-a22b-instruct-2507", - "display_name": "qwen3-235b-a22b-instruct-2507", - "modalities": { - "input": [ - "text", - "image" - ] - }, + "id": "minimax-m2.1", + "name": "minimax-m2.1", + "display_name": "minimax-m2.1", "limit": { - "context": 262144, - "output": 262144 + "context": 204800, + "output": 204800 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "cost": { - "input": 0.28, - "output": 1.12 + "input": 0.288, + "output": 1.152 }, "type": "chat" }, { - "id": "qwen3-235b-a22b-thinking-2507", - "name": "qwen3-235b-a22b-thinking-2507", - "display_name": "qwen3-235b-a22b-thinking-2507", + "id": "o3", + "name": "o3", + "display_name": "o3", "modalities": { "input": [ "text", @@ -75365,8 +86327,8 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 200000, + "output": 200000 }, "tool_call": true, "reasoning": { @@ -75374,63 +86336,63 @@ "default": true }, "cost": { - "input": 0.28, - "output": 2.8 + "input": 2, + "output": 8, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "qwen3-coder-30b-a3b-instruct", - "name": "qwen3-coder-30b-a3b-instruct", - "display_name": "qwen3-coder-30b-a3b-instruct", + "id": "wan2.6-i2v", + "name": "wan2.6-i2v", + "display_name": "wan2.6-i2v", "modalities": { "input": [ + "image", "text" ] }, "limit": { - "context": 2000000, - "output": 2000000 + "context": 8192, + "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "cost": { - "input": 0.2, - "output": 0.8, - "cache_read": 0.2 + "input": 2, + "output": 0 }, "type": "chat" }, { - "id": "qwen3-coder-480b-a35b-instruct", - "name": "qwen3-coder-480b-a35b-instruct", - "display_name": "qwen3-coder-480b-a35b-instruct", + "id": "wan2.6-t2v", + "name": "wan2.6-t2v", + "display_name": "wan2.6-t2v", "modalities": { "input": [ "text" ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 8192, + "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "cost": { - "input": 0.82, - "output": 3.28, - "cache_read": 0.82 + "input": 2, + "output": 0 }, "type": "chat" }, { - "id": "qwen3-235b-a22b", - "name": "qwen3-235b-a22b", - "display_name": "qwen3-235b-a22b", + "id": "o3-pro", + "name": "o3-pro", + "display_name": "o3-pro", "modalities": { "input": [ "text", @@ -75438,118 +86400,125 @@ ] }, "limit": { - "context": 131100, - "output": 131100 + "context": 200000, + "output": 200000 }, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "cost": { - "input": 0.28, - "output": 1.12 + "input": 20, + "output": 80, + "cache_read": 20 }, "type": "chat" }, { - "id": "qwen3-coder-flash", - "name": "qwen3-coder-flash", - "display_name": "qwen3-coder-flash", + "id": "step-3.5-flash", + "name": "step-3.5-flash", + "display_name": "step-3.5-flash", "modalities": { "input": [ - "text" + "text", + "image" ] }, "limit": { "context": 256000, "output": 256000 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "cost": { - "input": 0.136, - "output": 0.544, - "cache_read": 0.136 + "input": 0.1, + "output": 0.3 }, "type": "chat" }, { - "id": "qwen3-coder-plus", - "name": "qwen3-coder-plus", - "display_name": "qwen3-coder-plus", + "id": "wan2.2-i2v-plus", + "name": "wan2.2-i2v-plus", + "display_name": "wan2.2-i2v-plus", "modalities": { "input": [ - "text" + "text", + "image" ] }, "limit": { - "context": 1048576, - "output": 1048576 + "context": 8192, + "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "cost": { - "input": 0.54, - "output": 2.16, - "cache_read": 0.108 + "input": 2, + "output": 0 }, "type": "chat" }, { - "id": "qwen3-coder-plus-2025-07-22", - "name": "qwen3-coder-plus-2025-07-22", - "display_name": "qwen3-coder-plus-2025-07-22", + "id": "wan2.2-t2v-plus", + "name": "wan2.2-t2v-plus", + "display_name": "wan2.2-t2v-plus", "modalities": { "input": [ "text" ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 8192, + "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "cost": { - "input": 0.54, - "output": 2.16, - "cache_read": 0.54 + "input": 2, + "output": 0 }, "type": "chat" }, { - "id": "DeepSeek-V3", - "name": "DeepSeek-V3", - "display_name": "DeepSeek-V3", + "id": "wan2.5-i2v-preview", + "name": "wan2.5-i2v-preview", + "display_name": "wan2.5-i2v-preview", "modalities": { "input": [ - "text" + "text", + "image" ] }, "limit": { - "context": 1638000, - "output": 1638000 + "context": 8192, + "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "cost": { - "input": 0.272, - "output": 1.088 + "input": 2, + "output": 0 }, "type": "chat" }, { - "id": "LongCat-Flash-Chat", - "name": "LongCat-Flash-Chat", - "display_name": "LongCat-Flash-Chat", + "id": "wan2.5-t2v-preview", + "name": "wan2.5-t2v-preview", + "display_name": "wan2.5-t2v-preview", + "modalities": { + "input": [ + "text" + ] + }, "limit": { "context": 8192, "output": 8192 @@ -75559,49 +86528,33 @@ "supported": false }, "cost": { - "input": 0.14, - "output": 0.7 + "input": 2, + "output": 0 }, "type": "chat" }, { - "id": "gemini-2.5-pro-preview-06-05-search", - "name": "gemini-2.5-pro-preview-06-05-search", - "display_name": "gemini-2.5-pro-preview-06-05-search", - "modalities": { - "input": [ - "text", - "image", - "audio", - "video" - ] - }, + "id": "web-sora-2", + "name": "web-sora-2", + "display_name": "web-sora-2", "limit": { "context": 8192, "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 2, + "output": 2 }, "type": "chat" }, { - "id": "imagen-4.0-ultra-generate-exp-05-20", - "name": "imagen-4.0-ultra-generate-exp-05-20", - "display_name": "imagen-4.0-ultra-generate-exp-05-20", - "modalities": { - "input": [ - "text", - "image" - ] - }, + "id": "web-sora-2-pro", + "name": "web-sora-2-pro", + "display_name": "web-sora-2-pro", "limit": { "context": 8192, "output": 8192 @@ -75612,22 +86565,14 @@ }, "cost": { "input": 2, - "output": 2, - "cache_read": 0 + "output": 2 }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "Qwen2.5-VL-72B-Instruct", - "name": "Qwen2.5-VL-72B-Instruct", - "display_name": "Qwen2.5-VL-72B-Instruct", - "modalities": { - "input": [ - "text", - "image", - "video" - ] - }, + "id": "cc-glm-4.6", + "name": "cc-glm-4.6", + "display_name": "cc-glm-4.6", "limit": { "context": 8192, "output": 8192 @@ -75637,23 +86582,23 @@ "supported": false }, "cost": { - "input": 0.62, - "output": 0.62 + "input": 0.06, + "output": 0.22 }, "type": "chat" }, { - "id": "ernie-5.0-thinking-preview", - "name": "ernie-5.0-thinking-preview", - "display_name": "ernie-5.0-thinking-preview", + "id": "coding-glm-4.6", + "name": "coding-glm-4.6", + "display_name": "coding-glm-4.6", "modalities": { "input": [ "text" ] }, "limit": { - "context": 183000, - "output": 183000 + "context": 8192, + "output": 8192 }, "tool_call": true, "reasoning": { @@ -75661,46 +86606,49 @@ "default": true }, "cost": { - "input": 0.822, - "output": 3.288 + "input": 0.06, + "output": 0.22, + "cache_read": 0.010998 }, "type": "chat" }, { - "id": "inclusionAI/Ling-1T", - "name": "inclusionAI/Ling-1T", - "display_name": "inclusionAI/Ling-1T", + "id": "coding-glm-4.6-free", + "name": "coding-glm-4.6-free", + "display_name": "coding-glm-4.6-free", "modalities": { "input": [ "text" ] }, - "limit": { - "context": 8192, - "output": 8192 + "limit": { + "context": 200000, + "output": 200000 }, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "cost": { - "input": 0.548, - "output": 2.192 + "input": 0, + "output": 0, + "cache_read": 0 }, "type": "chat" }, { - "id": "inclusionAI/Ring-1T", - "name": "inclusionAI/Ring-1T", - "display_name": "inclusionAI/Ring-1T", + "id": "coding-minimax-m2", + "name": "coding-minimax-m2", + "display_name": "coding-minimax-m2", "modalities": { "input": [ "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 204800, + "output": 204800 }, "tool_call": true, "reasoning": { @@ -75708,44 +86656,44 @@ "default": true }, "cost": { - "input": 0.548, - "output": 2.192 + "input": 0.2, + "output": 0.2 }, "type": "chat" }, { - "id": "glm-4.5-x", - "name": "glm-4.5-x", - "display_name": "glm-4.5-x", + "id": "coding-minimax-m2-free", + "name": "coding-minimax-m2-free", + "display_name": "coding-minimax-m2-free", "modalities": { "input": [ "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 204800, + "output": 204800 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "cost": { - "input": 2.2, - "output": 8.91, - "cache_read": 0.44 + "input": 0, + "output": 0, + "cache_read": 0 }, "type": "chat" }, { - "id": "gme-qwen2-vl-2b-instruct", - "name": "gme-qwen2-vl-2b-instruct", - "display_name": "gme-qwen2-vl-2b-instruct", + "id": "flux-2-flex", + "name": "flux-2-flex", + "display_name": "flux-2-flex", "modalities": { "input": [ "text", - "image", - "video" + "image" ] }, "limit": { @@ -75757,15 +86705,16 @@ "supported": false }, "cost": { - "input": 0.138, - "output": 0.138 + "input": 2, + "output": 0, + "cache_read": 0 }, - "type": "embedding" + "type": "imageGeneration" }, { - "id": "gte-rerank-v2", - "name": "gte-rerank-v2", - "display_name": "gte-rerank-v2", + "id": "flux-2-pro", + "name": "flux-2-pro", + "display_name": "flux-2-pro", "modalities": { "input": [ "text", @@ -75781,85 +86730,102 @@ "supported": false }, "cost": { - "input": 0.11, - "output": 0.11 + "input": 2, + "output": 0, + "cache_read": 0 }, - "type": "rerank" + "type": "imageGeneration" }, { - "id": "inclusionAI/Ling-flash-2.0", - "name": "inclusionAI/Ling-flash-2.0", - "display_name": "inclusionAI/Ling-flash-2.0", + "id": "gemini-2.5-pro", + "name": "gemini-2.5-pro", + "display_name": "gemini-2.5-pro", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video", + "pdf" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 1048576, + "output": 1048576 }, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "cost": { - "input": 0.136, - "output": 0.544 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "inclusionAI/Ling-mini-2.0", - "name": "inclusionAI/Ling-mini-2.0", - "display_name": "inclusionAI/Ling-mini-2.0", + "id": "glm-4.6", + "name": "glm-4.6", + "display_name": "glm-4.6", "modalities": { "input": [ "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 204800, + "output": 204800 }, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "cost": { - "input": 0.068, - "output": 0.272 + "input": 0, + "output": 0, + "cache_read": 0 }, "type": "chat" }, { - "id": "inclusionAI/Ring-flash-2.0", - "name": "inclusionAI/Ring-flash-2.0", - "display_name": "inclusionAI/Ring-flash-2.0", + "id": "glm-4.6v", + "name": "glm-4.6v", + "display_name": "glm-4.6v", "modalities": { "input": [ - "text" + "text", + "image", + "video" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 128000, + "output": 128000 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "cost": { - "input": 0.136, - "output": 0.544 + "input": 0.137, + "output": 0.411, + "cache_read": 0.0274 }, "type": "chat" }, { - "id": "irag-1.0", - "name": "irag-1.0", - "display_name": "irag-1.0", + "id": "jimeng-3.0-1080p", + "name": "jimeng-3.0-1080p", + "display_name": "jimeng-3.0-1080p", + "modalities": { + "input": [ + "text", + "image" + ] + }, "limit": { "context": 8192, "output": 8192 @@ -75870,15 +86836,14 @@ }, "cost": { "input": 2, - "output": 0, - "cache_read": 0 + "output": 0 }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "jina-deepsearch-v1", - "name": "jina-deepsearch-v1", - "display_name": "jina-deepsearch-v1", + "id": "jimeng-3.0-720p", + "name": "jimeng-3.0-720p", + "display_name": "jimeng-3.0-720p", "modalities": { "input": [ "text", @@ -75886,24 +86851,23 @@ ] }, "limit": { - "context": 1000000, - "output": 1000000 + "context": 8192, + "output": 8192 }, "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "cost": { - "input": 0.05, - "output": 0.05 + "input": 2, + "output": 0 }, "type": "chat" }, { - "id": "jina-embeddings-v4", - "name": "jina-embeddings-v4", - "display_name": "jina-embeddings-v4", + "id": "jimeng-3.0-pro", + "name": "jimeng-3.0-pro", + "display_name": "jimeng-3.0-pro", "modalities": { "input": [ "text", @@ -75919,43 +86883,47 @@ "supported": false }, "cost": { - "input": 0.05, - "output": 0.05 + "input": 2, + "output": 0 }, - "type": "embedding" + "type": "chat" }, { - "id": "jina-reranker-v3", - "name": "jina-reranker-v3", - "display_name": "jina-reranker-v3", + "id": "kimi-for-coding-free", + "name": "kimi-for-coding-free", + "display_name": "kimi-for-coding-free", "modalities": { "input": [ - "text", - "image" + "text" ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 256000, + "output": 256000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "cost": { - "input": 0.05, - "output": 0.05 + "input": 0, + "output": 0, + "cache_read": 0 }, - "type": "rerank" + "type": "chat" }, { - "id": "llama-4-maverick", - "name": "llama-4-maverick", - "display_name": "llama-4-maverick", + "id": "gemini-2.5-pro-search", + "name": "gemini-2.5-pro-search", + "display_name": "gemini-2.5-pro-search", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video", + "pdf" ] }, "limit": { @@ -75964,92 +86932,91 @@ }, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "cost": { - "input": 0.2, - "output": 0.2 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "llama-4-scout", - "name": "llama-4-scout", - "display_name": "llama-4-scout", + "id": "kimi-k2-thinking", + "name": "kimi-k2-thinking", + "display_name": "kimi-k2-thinking", "modalities": { "input": [ - "text", - "image" + "text" ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 262144, + "output": 262144 }, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "cost": { - "input": 0.2, - "output": 0.2 + "input": 0.548, + "output": 2.192, + "cache_read": 0.137 }, "type": "chat" }, { - "id": "qwen-image", - "name": "qwen-image", - "display_name": "qwen-image", + "id": "Kimi-K2-0905", + "name": "Kimi-K2-0905", + "display_name": "Kimi-K2-0905", "modalities": { "input": [ - "text", - "image" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 262144, + "output": 262144 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "cost": { - "input": 2, - "output": 0, - "cache_read": 0 + "input": 0.548, + "output": 2.192 }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "qwen-image-edit", - "name": "qwen-image-edit", - "display_name": "qwen-image-edit", + "id": "DeepSeek-V3.1-Fast", + "name": "DeepSeek-V3.1-Fast", + "display_name": "DeepSeek-V3.1-Fast", "modalities": { "input": [ - "text", - "image" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 163000, + "output": 163000 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "cost": { - "input": 2, - "output": 0, - "cache_read": 0 + "input": 1.096, + "output": 3.288 }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "qwen-image-plus", - "name": "qwen-image-plus", - "display_name": "qwen-image-plus", + "id": "claude-opus-4-0", + "name": "claude-opus-4-0", + "display_name": "claude-opus-4-0", "modalities": { "input": [ "text", @@ -76057,306 +87024,317 @@ ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 200000, + "output": 200000 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "cost": { - "input": 2, - "output": 0, - "cache_read": 0 + "input": 16.5, + "output": 82.5 }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "qwen-mt-plus", - "name": "qwen-mt-plus", - "display_name": "qwen-mt-plus", + "id": "claude-sonnet-4-0", + "name": "claude-sonnet-4-0", + "display_name": "claude-sonnet-4-0", "modalities": { "input": [ - "text" + "text", + "image" ] }, "limit": { - "context": 16000, - "output": 16000 + "context": 1000000, + "output": 1000000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "cost": { - "input": 0.492, - "output": 1.476 + "input": 3.3, + "output": 16.5, + "cache_read": 0.33 }, "type": "chat" }, { - "id": "qwen-mt-turbo", - "name": "qwen-mt-turbo", - "display_name": "qwen-mt-turbo", + "id": "gemini-2.5-flash", + "name": "gemini-2.5-flash", + "display_name": "gemini-2.5-flash", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video" ] }, "limit": { - "context": 16000, - "output": 16000 + "context": 1048576, + "output": 1048576 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "cost": { - "input": 0.192, - "output": 0.534912 + "input": 0.3, + "output": 2.499, + "cache_read": 0.03 }, "type": "chat" }, { - "id": "qwen3-embedding-0.6b", - "name": "qwen3-embedding-0.6b", - "display_name": "qwen3-embedding-0.6b", + "id": "gemini-2.5-flash-preview-09-2025", + "name": "gemini-2.5-flash-preview-09-2025", + "display_name": "gemini-2.5-flash-preview-09-2025", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 1048576, + "output": 1048576 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "cost": { - "input": 0.068, - "output": 0.068 + "input": 0.3, + "output": 2.499, + "cache_read": 0.03 }, - "type": "embedding" + "type": "chat" }, { - "id": "qwen3-embedding-4b", - "name": "qwen3-embedding-4b", - "display_name": "qwen3-embedding-4b", + "id": "glm-4.5v", + "name": "glm-4.5v", + "display_name": "glm-4.5v", "modalities": { "input": [ - "text" + "text", + "image", + "video" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 64000, + "output": 64000 }, "tool_call": false, "reasoning": { "supported": false }, "cost": { - "input": 0.068, - "output": 0.068 + "input": 0.274, + "output": 0.822, + "cache_read": 0.274 }, - "type": "embedding" + "type": "chat" }, { - "id": "qwen3-embedding-8b", - "name": "qwen3-embedding-8b", - "display_name": "qwen3-embedding-8b", + "id": "gemini-2.5-flash-lite", + "name": "gemini-2.5-flash-lite", + "display_name": "gemini-2.5-flash-lite", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 1048576, + "output": 1048576 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "cost": { - "input": 0.068, - "output": 0.068 + "input": 0.1, + "output": 0.4, + "cache_read": 0.01 }, - "type": "embedding" + "type": "chat" }, { - "id": "qwen3-reranker-0.6b", - "name": "qwen3-reranker-0.6b", - "display_name": "qwen3-reranker-0.6b", + "id": "gemini-2.5-flash-lite-preview-09-2025", + "name": "gemini-2.5-flash-lite-preview-09-2025", + "display_name": "gemini-2.5-flash-lite-preview-09-2025", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video" ] }, "limit": { - "context": 16000, - "output": 16000 + "context": 1048576, + "output": 1048576 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "cost": { - "input": 0.11, - "output": 0.11 + "input": 0.1, + "output": 0.4, + "cache_read": 0.01 }, - "type": "rerank" + "type": "chat" }, { - "id": "qwen3-reranker-4b", - "name": "qwen3-reranker-4b", - "display_name": "qwen3-reranker-4b", + "id": "gemini-2.5-flash-nothink", + "name": "gemini-2.5-flash-nothink", + "display_name": "gemini-2.5-flash-nothink", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 1047576, + "output": 1047576 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "cost": { - "input": 0.11, - "output": 0.11 + "input": 0.3, + "output": 2.499, + "cache_read": 0.03 }, - "type": "rerank" + "type": "chat" }, { - "id": "qwen3-reranker-8b", - "name": "qwen3-reranker-8b", - "display_name": "qwen3-reranker-8b", + "id": "gemini-2.5-flash-search", + "name": "gemini-2.5-flash-search", + "display_name": "gemini-2.5-flash-search", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video" ] }, "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 0.11, - "output": 0.11 - }, - "type": "rerank" - }, - { - "id": "tao-8k", - "name": "tao-8k", - "display_name": "tao-8k", - "limit": { - "context": 8192, - "output": 8192 + "context": 1048576, + "output": 1048576 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "cost": { - "input": 0.068, - "output": 0.068 + "cost": { + "input": 0.3, + "output": 2.499, + "cache_read": 0.03 }, - "type": "embedding" + "type": "chat" }, { - "id": "bce-reranker-base", - "name": "bce-reranker-base", - "display_name": "bce-reranker-base", + "id": "gemini-2.5-flash-preview-05-20-nothink", + "name": "gemini-2.5-flash-preview-05-20-nothink", + "display_name": "gemini-2.5-flash-preview-05-20-nothink", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 1048576, + "output": 1048576 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "cost": { - "input": 0.068, - "output": 0.068 + "input": 0.3, + "output": 2.499, + "cache_read": 0.03 }, - "type": "rerank" + "type": "chat" }, { - "id": "codex-mini-latest", - "name": "codex-mini-latest", - "display_name": "codex-mini-latest", + "id": "gemini-2.5-flash-preview-05-20-search", + "name": "gemini-2.5-flash-preview-05-20-search", + "display_name": "gemini-2.5-flash-preview-05-20-search", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 1048576, + "output": 1048576 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "cost": { - "input": 1.5, - "output": 6, - "cache_read": 0.375 + "input": 0.3, + "output": 2.499, + "cache_read": 0.03 }, "type": "chat" }, { - "id": "doubao-seedream-4-0", - "name": "doubao-seedream-4-0", - "display_name": "doubao-seedream-4-0", + "id": "DeepSeek-V3-Fast", + "name": "DeepSeek-V3-Fast", + "display_name": "DeepSeek-V3-Fast", "modalities": { "input": [ - "text", - "image" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 32000, + "output": 32000 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "cost": { - "input": 2, - "output": 0, - "cache_read": 0 + "input": 0.56, + "output": 2.24 }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "embedding-v1", - "name": "embedding-v1", - "display_name": "embedding-v1", + "id": "veo-2.0-generate-001", + "name": "veo-2.0-generate-001", + "display_name": "veo-2.0-generate-001", "modalities": { "input": [ - "text" + "video" ] }, "limit": { @@ -76368,39 +87346,34 @@ "supported": false }, "cost": { - "input": 0.068, - "output": 0.068 + "input": 2, + "output": 2, + "cache_read": 0 }, - "type": "embedding" + "type": "chat" }, { - "id": "ernie-4.5-turbo-latest", - "name": "ernie-4.5-turbo-latest", - "display_name": "ernie-4.5-turbo-latest", - "modalities": { - "input": [ - "text", - "image" - ] - }, + "id": "veo3.1", + "name": "veo3.1", + "display_name": "veo3.1", "limit": { - "context": 135000, - "output": 135000 + "context": 8192, + "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "cost": { - "input": 0.11, - "output": 0.44 + "input": 200, + "output": 200 }, "type": "chat" }, { - "id": "ernie-irag-edit", - "name": "ernie-irag-edit", - "display_name": "ernie-irag-edit", + "id": "imagen-4.0", + "name": "imagen-4.0", + "display_name": "imagen-4.0", "modalities": { "input": [ "text", @@ -76411,21 +87384,21 @@ "context": 8192, "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "cost": { "input": 2, - "output": 0, + "output": 2, "cache_read": 0 }, "type": "imageGeneration" }, { - "id": "jina-clip-v2", - "name": "jina-clip-v2", - "display_name": "jina-clip-v2", + "id": "imagen-4.0-fast-generate-001", + "name": "imagen-4.0-fast-generate-001", + "display_name": "imagen-4.0-fast-generate-001", "modalities": { "input": [ "text", @@ -76441,15 +87414,15 @@ "supported": false }, "cost": { - "input": 0.05, - "output": 0.05 + "input": 2, + "output": 2 }, - "type": "embedding" + "type": "imageGeneration" }, { - "id": "jina-reranker-m0", - "name": "jina-reranker-m0", - "display_name": "jina-reranker-m0", + "id": "imagen-4.0-fast-generate-preview-06-06", + "name": "imagen-4.0-fast-generate-preview-06-06", + "display_name": "imagen-4.0-fast-generate-preview-06-06", "modalities": { "input": [ "text", @@ -76465,18 +87438,19 @@ "supported": false }, "cost": { - "input": 0.05, - "output": 0.05 + "input": 2, + "output": 2 }, - "type": "rerank" + "type": "imageGeneration" }, { - "id": "jina-colbert-v2", - "name": "jina-colbert-v2", - "display_name": "jina-colbert-v2", + "id": "imagen-4.0-generate-001", + "name": "imagen-4.0-generate-001", + "display_name": "imagen-4.0-generate-001", "modalities": { "input": [ - "text" + "text", + "image" ] }, "limit": { @@ -76488,15 +87462,15 @@ "supported": false }, "cost": { - "input": 0.05, - "output": 0.05 + "input": 2, + "output": 2 }, - "type": "embedding" + "type": "imageGeneration" }, { - "id": "gpt-4o-search-preview", - "name": "gpt-4o-search-preview", - "display_name": "gpt-4o-search-preview", + "id": "imagen-4.0-ultra-generate-001", + "name": "imagen-4.0-ultra-generate-001", + "display_name": "imagen-4.0-ultra-generate-001", "modalities": { "input": [ "text", @@ -76504,47 +87478,48 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 8192, + "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "cost": { - "input": 2.5, - "output": 10, - "cache_read": 1.25 + "input": 2, + "output": 2 }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "DeepSeek-R1", - "name": "DeepSeek-R1", - "display_name": "DeepSeek-R1", + "id": "imagen-4.0-ultra", + "name": "imagen-4.0-ultra", + "display_name": "imagen-4.0-ultra", "modalities": { "input": [ - "text" + "text", + "image" ] }, "limit": { - "context": 1638000, - "output": 1638000 + "context": 8192, + "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "cost": { - "input": 0.4, - "output": 2 + "input": 2, + "output": 2, + "cache_read": 0 }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "gpt-4o-mini-search-preview", - "name": "gpt-4o-mini-search-preview", - "display_name": "gpt-4o-mini-search-preview", + "id": "gpt-image-1", + "name": "gpt-image-1", + "display_name": "gpt-image-1", "modalities": { "input": [ "text", @@ -76552,27 +87527,28 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 8192, + "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "cost": { - "input": 0.15, - "output": 0.6, - "cache_read": 0.075 + "input": 5, + "output": 40, + "cache_read": 5 }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "jina-embeddings-v3", - "name": "jina-embeddings-v3", - "display_name": "jina-embeddings-v3", + "id": "gpt-image-1-mini", + "name": "gpt-image-1-mini", + "display_name": "gpt-image-1-mini", "modalities": { "input": [ - "text" + "text", + "image" ] }, "limit": { @@ -76584,49 +87560,42 @@ "supported": false }, "cost": { - "input": 0.05, - "output": 0.05, - "cache_read": 0 + "input": 5, + "output": 40, + "cache_read": 5 }, - "type": "embedding" + "type": "imageGeneration" }, { - "id": "gemini-2.0-flash", - "name": "gemini-2.0-flash", - "display_name": "gemini-2.0-flash", + "id": "o4-mini", + "name": "o4-mini", + "display_name": "o4-mini", "modalities": { "input": [ "text", - "image", - "audio", - "video" + "image" ] }, "limit": { - "context": 1048576, - "output": 1048576 + "context": 200000, + "output": 200000 }, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.025 + "input": 1.1, + "output": 4.4, + "cache_read": 0.275 }, "type": "chat" }, { - "id": "gemini-2.0-flash-preview-image-generation", - "name": "gemini-2.0-flash-preview-image-generation", - "display_name": "gemini-2.0-flash-preview-image-generation", - "modalities": { - "input": [ - "text", - "image" - ] - }, + "id": "paddleocr-vl-0.9b", + "name": "paddleocr-vl-0.9b", + "display_name": "paddleocr-vl-0.9b", "limit": { "context": 8192, "output": 8192 @@ -76636,73 +87605,68 @@ "supported": false }, "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0 + "input": 2, + "output": 0 }, "type": "chat" }, { - "id": "mimo-v2-flash-free", - "name": "mimo-v2-flash-free", - "display_name": "mimo-v2-flash-free", - "modalities": { - "input": [ - "text" - ] - }, + "id": "pp-structurev3", + "name": "pp-structurev3", + "display_name": "pp-structurev3", "limit": { - "context": 256000, - "output": 256000 + "context": 8192, + "output": 8192 }, "tool_call": false, "reasoning": { "supported": false }, "cost": { - "input": 0, - "output": 0, - "cache_read": 0 + "input": 2, + "output": 0 }, "type": "chat" }, { - "id": "FLUX.1-Kontext-pro", - "name": "FLUX.1-Kontext-pro", - "display_name": "FLUX.1-Kontext-pro", + "id": "qwen3-vl-235b-a22b-instruct", + "name": "qwen3-vl-235b-a22b-instruct", + "display_name": "qwen3-vl-235b-a22b-instruct", "modalities": { "input": [ "text", - "image" + "image", + "video" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 131000, + "output": 131000 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "cost": { - "input": 40, - "output": 40 + "input": 0.274, + "output": 1.096 }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "claude-3-7-sonnet", - "name": "claude-3-7-sonnet", - "display_name": "claude-3-7-sonnet", + "id": "qwen3-vl-235b-a22b-thinking", + "name": "qwen3-vl-235b-a22b-thinking", + "display_name": "qwen3-vl-235b-a22b-thinking", "modalities": { "input": [ "text", - "image" + "image", + "video" ] }, "limit": { - "context": 200000, - "output": 200000 + "context": 131000, + "output": 131000 }, "tool_call": true, "reasoning": { @@ -76710,67 +87674,71 @@ "default": true }, "cost": { - "input": 3.3, - "output": 16.5 + "input": 0.274, + "output": 2.74 }, "type": "chat" }, { - "id": "ernie-4.5", - "name": "ernie-4.5", - "display_name": "ernie-4.5", + "id": "qwen3-vl-30b-a3b-instruct", + "name": "qwen3-vl-30b-a3b-instruct", + "display_name": "qwen3-vl-30b-a3b-instruct", "modalities": { "input": [ "text", - "image" + "image", + "video" ] }, "limit": { - "context": 160000, - "output": 160000 + "context": 128000, + "output": 128000 }, "tool_call": true, "reasoning": { "supported": false }, "cost": { - "input": 0.068, - "output": 0.272 + "input": 0.1028, + "output": 0.4112 }, "type": "chat" }, { - "id": "ernie-4.5-turbo-vl", - "name": "ernie-4.5-turbo-vl", - "display_name": "ernie-4.5-turbo-vl", + "id": "qwen3-vl-30b-a3b-thinking", + "name": "qwen3-vl-30b-a3b-thinking", + "display_name": "qwen3-vl-30b-a3b-thinking", "modalities": { "input": [ "text", - "image" + "image", + "video" ] }, "limit": { - "context": 139000, - "output": 139000 + "context": 128000, + "output": 128000 }, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "cost": { - "input": 0.4, - "output": 1.2 + "input": 0.1028, + "output": 1.028 }, "type": "chat" }, { - "id": "FLUX-1.1-pro", - "name": "FLUX-1.1-pro", - "display_name": "FLUX-1.1-pro", + "id": "veo-3.0-generate-preview", + "name": "veo-3.0-generate-preview", + "display_name": "veo-3.0-generate-preview", "modalities": { "input": [ "text", - "image" + "image", + "video" ] }, "limit": { @@ -76782,42 +87750,41 @@ "supported": false }, "cost": { - "input": 40, - "output": 40, + "input": 2, + "output": 2, "cache_read": 0 }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "o3-mini", - "name": "o3-mini", - "display_name": "o3-mini", + "id": "veo-3.1-fast-generate-preview", + "name": "veo-3.1-fast-generate-preview", + "display_name": "veo-3.1-fast-generate-preview", "modalities": { "input": [ "text", - "image" + "image", + "video" ] }, "limit": { - "context": 200000, - "output": 200000 + "context": 8192, + "output": 8192 }, "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.55 + "input": 2, + "output": 0 }, "type": "chat" }, { - "id": "doubao-seed-1-6", - "name": "doubao-seed-1-6", - "display_name": "doubao-seed-1-6", + "id": "veo-3.1-generate-preview", + "name": "veo-3.1-generate-preview", + "display_name": "veo-3.1-generate-preview", "modalities": { "input": [ "text", @@ -76826,106 +87793,98 @@ ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 8192, + "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "cost": { - "input": 0.18, - "output": 1.8, - "cache_read": 0.036 + "input": 2, + "output": 2, + "cache_read": 0 }, "type": "chat" }, { - "id": "doubao-seed-1-6-flash", - "name": "doubao-seed-1-6-flash", - "display_name": "doubao-seed-1-6-flash", + "id": "DeepSeek-OCR", + "name": "DeepSeek-OCR", + "display_name": "DeepSeek-OCR", "modalities": { "input": [ "text", - "image", - "video" + "image" ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 8000, + "output": 8000 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "cost": { - "input": 0.044, - "output": 0.44, - "cache_read": 0.0088 + "input": 0.02, + "output": 0.02 }, "type": "chat" }, { - "id": "doubao-seed-1-6-lite", - "name": "doubao-seed-1-6-lite", - "display_name": "doubao-seed-1-6-lite", + "id": "deepseek-ocr", + "name": "deepseek-ocr", + "display_name": "deepseek-ocr", "modalities": { "input": [ "text", - "image", - "video" + "image" ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 8000, + "output": 8000 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "cost": { - "input": 0.082, - "output": 0.656, - "cache_read": 0.0164 + "input": 0.02, + "output": 0.02 }, "type": "chat" }, { - "id": "doubao-seed-1-6-thinking", - "name": "doubao-seed-1-6-thinking", - "display_name": "doubao-seed-1-6-thinking", + "id": "ernie-5.0-thinking-exp", + "name": "ernie-5.0-thinking-exp", + "display_name": "ernie-5.0-thinking-exp", "modalities": { "input": [ "text", - "image", - "video" + "image" ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 119000, + "output": 119000 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, "cost": { - "input": 0.18, - "output": 1.8, - "cache_read": 0.036 + "input": 0.82192, + "output": 3.28768, + "cache_read": 0.82192 }, "type": "chat" }, { - "id": "qwen3-30b-a3b-instruct-2507", - "name": "qwen3-30b-a3b-instruct-2507", - "display_name": "qwen3-30b-a3b-instruct-2507", + "id": "flux-kontext-max", + "name": "flux-kontext-max", + "display_name": "flux-kontext-max", "limit": { "context": 8192, "output": 8192 @@ -76935,82 +87894,98 @@ "supported": false }, "cost": { - "input": 0.1028, - "output": 0.4112 + "input": 2, + "output": 0, + "cache_read": 0 + }, + "type": "chat" + }, + { + "id": "gemini-2.5-flash-image-preview", + "name": "gemini-2.5-flash-image-preview", + "display_name": "gemini-2.5-flash-image-preview", + "modalities": { + "input": [ + "image", + "text" + ] }, - "type": "chat" - }, - { - "id": "qwen3-30b-a3b-thinking-2507", - "name": "qwen3-30b-a3b-thinking-2507", - "display_name": "qwen3-30b-a3b-thinking-2507", "limit": { - "context": 8192, - "output": 8192 + "context": 32800, + "output": 32800 }, "tool_call": false, "reasoning": { "supported": false }, "cost": { - "input": 0.12, - "output": 1.2 + "input": 0.3, + "output": 1.2, + "cache_read": 0.3 }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "qwen-3-235b-a22b-thinking-2507", - "name": "qwen-3-235b-a22b-thinking-2507", - "display_name": "qwen-3-235b-a22b-thinking-2507", + "id": "glm-4.5", + "name": "glm-4.5", + "display_name": "glm-4.5", + "modalities": { + "input": [ + "text" + ] + }, "limit": { - "context": 8192, - "output": 8192 + "context": 131072, + "output": 131072 }, "tool_call": false, "reasoning": { "supported": false }, "cost": { - "input": 0.28, - "output": 2.8 + "input": 0.4, + "output": 1.6 }, "type": "chat" }, { - "id": "gemini-embedding-001", - "name": "gemini-embedding-001", - "display_name": "gemini-embedding-001", + "id": "gpt-4.1", + "name": "gpt-4.1", + "display_name": "gpt-4.1", "modalities": { "input": [ - "text" + "text", + "image" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 1047576, + "output": 1047576 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "cost": { - "input": 0.15, - "output": 0.15 + "input": 2, + "output": 8, + "cache_read": 0.5 }, - "type": "embedding" + "type": "chat" }, { - "id": "gpt-oss-120b", - "name": "gpt-oss-120b", - "display_name": "gpt-oss-120b", + "id": "grok-4", + "name": "grok-4", + "display_name": "grok-4", "modalities": { "input": [ - "text" + "text", + "image" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 256000, + "output": 256000 }, "tool_call": true, "reasoning": { @@ -77018,119 +87993,132 @@ "default": true }, "cost": { - "input": 0.18, - "output": 0.9 + "input": 3.3, + "output": 16.5, + "cache_read": 0.825 }, "type": "chat" }, { - "id": "DeepSeek-R1-Distill-Qwen-32B", - "name": "DeepSeek-R1-Distill-Qwen-32B", - "display_name": "DeepSeek-R1-Distill-Qwen-32B", + "id": "grok-4-fast-non-reasoning", + "name": "grok-4-fast-non-reasoning", + "display_name": "grok-4-fast-non-reasoning", "limit": { - "context": 8192, - "output": 8192 + "context": 2000000, + "output": 2000000 }, "tool_call": false, "reasoning": { "supported": false }, "cost": { - "input": 0.28, - "output": 0.84 + "input": 0.2, + "output": 0.5, + "cache_read": 0.05 }, "type": "chat" }, { - "id": "DeepSeek-R1-Distill-Qwen-7B", - "name": "DeepSeek-R1-Distill-Qwen-7B", - "display_name": "DeepSeek-R1-Distill-Qwen-7B", + "id": "grok-4-fast-reasoning", + "name": "grok-4-fast-reasoning", + "display_name": "grok-4-fast-reasoning", "limit": { - "context": 8192, - "output": 8192 + "context": 2000000, + "output": 2000000 }, "tool_call": false, "reasoning": { "supported": false }, "cost": { - "input": 0.06, - "output": 0.12 + "input": 0.2, + "output": 0.5, + "cache_read": 0.05 }, "type": "chat" }, { - "id": "QwQ-32B", - "name": "QwQ-32B", - "display_name": "QwQ-32B", + "id": "kimi-k2-0711", + "name": "kimi-k2-0711", + "display_name": "kimi-k2-0711", + "modalities": { + "input": [ + "text" + ] + }, "limit": { - "context": 8192, - "output": 8192 + "context": 131000, + "output": 131000 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "cost": { - "input": 0.28, - "output": 0.84 + "input": 0.54, + "output": 2.16 }, "type": "chat" }, { - "id": "Qwen2-VL-72B-Instruct", - "name": "Qwen2-VL-72B-Instruct", - "display_name": "Qwen2-VL-72B-Instruct", + "id": "kimi-k2-turbo-preview", + "name": "kimi-k2-turbo-preview", + "display_name": "kimi-k2-turbo-preview", "modalities": { "input": [ - "text", - "image", - "video" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 262144, + "output": 262144 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "cost": { - "input": 2.18, - "output": 6.54 + "input": 1.2, + "output": 4.8, + "cache_read": 0.3 }, "type": "chat" }, { - "id": "Qwen2-VL-7B-Instruct", - "name": "Qwen2-VL-7B-Instruct", - "display_name": "Qwen2-VL-7B-Instruct", + "id": "gpt-4.1-mini", + "name": "gpt-4.1-mini", + "display_name": "gpt-4.1-mini", "modalities": { "input": [ "text", - "image", - "video" + "image" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 1047576, + "output": 1047576 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "cost": { - "input": 0.28, - "output": 0.7 + "input": 0.4, + "output": 1.6, + "cache_read": 0.1 }, "type": "chat" }, { - "id": "cc-kimi-for-coding", - "name": "cc-kimi-for-coding", - "display_name": "cc-kimi-for-coding", + "id": "aihubmix-router", + "name": "aihubmix-router", + "display_name": "aihubmix-router", + "modalities": { + "input": [ + "text", + "image" + ] + }, "limit": { "context": 8192, "output": 8192 @@ -77140,88 +88128,123 @@ "supported": false }, "cost": { - "input": 0.2, - "output": 0.2, - "cache_read": 0.02 + "input": 0.4, + "output": 1.6, + "cache_read": 0.1 }, "type": "chat" }, { - "id": "Qwen/Qwen3-30B-A3B", - "name": "Qwen/Qwen3-30B-A3B", - "display_name": "Qwen/Qwen3-30B-A3B", + "id": "gpt-4.1-nano", + "name": "gpt-4.1-nano", + "display_name": "gpt-4.1-nano", + "modalities": { + "input": [ + "text", + "image" + ] + }, "limit": { - "context": 8192, - "output": 8192 + "context": 1047576, + "output": 1047576 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "cost": { - "input": 1, - "output": 1 + "input": 0.1, + "output": 0.4, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "Qwen/Qwen3-32B", - "name": "Qwen/Qwen3-32B", - "display_name": "Qwen/Qwen3-32B", + "id": "gemini-2.5-pro-preview-05-06", + "name": "gemini-2.5-pro-preview-05-06", + "display_name": "gemini-2.5-pro-preview-05-06", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video" + ] + }, "limit": { - "context": 8192, - "output": 8192 + "context": 1048576, + "output": 1048576 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "cost": { - "input": 0.4, - "output": 0.8 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "Qwen/Qwen3-14B", - "name": "Qwen/Qwen3-14B", - "display_name": "Qwen/Qwen3-14B", + "id": "gemini-2.5-pro-preview-03-25", + "name": "gemini-2.5-pro-preview-03-25", + "display_name": "gemini-2.5-pro-preview-03-25", + "modalities": { + "input": [ + "text", + "image" + ] + }, "limit": { "context": 8192, "output": 8192 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "cost": { - "input": 0.5, - "output": 0.5 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "Qwen/Qwen3-8B", - "name": "Qwen/Qwen3-8B", - "display_name": "Qwen/Qwen3-8B", + "id": "gemini-2.5-pro-preview-05-06-search", + "name": "gemini-2.5-pro-preview-05-06-search", + "display_name": "gemini-2.5-pro-preview-05-06-search", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video" + ] + }, "limit": { "context": 8192, "output": 8192 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "cost": { - "input": 0.2, - "output": 0.2 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "gemini-2.0-pro-exp-02-05-search", - "name": "gemini-2.0-pro-exp-02-05-search", - "display_name": "gemini-2.0-pro-exp-02-05-search", + "id": "gemini-2.5-pro-preview-03-25-search", + "name": "gemini-2.5-pro-preview-03-25-search", + "display_name": "gemini-2.5-pro-preview-03-25-search", "modalities": { "input": [ "text", @@ -77234,215 +88257,218 @@ "context": 8192, "output": 8192 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "cost": { "input": 1.25, - "output": 5 + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "gemini-2.0-flash-search", - "name": "gemini-2.0-flash-search", - "display_name": "gemini-2.0-flash-search", + "id": "qwen3-max-preview", + "name": "qwen3-max-preview", + "display_name": "qwen3-max-preview", "modalities": { "input": [ "text", - "image", - "audio", - "video" + "image" ] }, "limit": { "context": 8192, "output": 8192 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.025 + "input": 0.822, + "output": 3.288, + "cache_read": 0.822 }, "type": "chat" }, { - "id": "gemini-2.5-pro-preview-06-05", - "name": "gemini-2.5-pro-preview-06-05", - "display_name": "gemini-2.5-pro-preview-06-05", + "id": "qwen3-max", + "name": "qwen3-max", + "display_name": "qwen3-max", "modalities": { "input": [ "text", - "image", - "audio", - "video" + "image" ] }, "limit": { - "context": 1048576, - "output": 1048576 + "context": 262144, + "output": 262144 }, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 0.34246, + "output": 1.36984, + "cache_read": 0.34246 }, "type": "chat" }, { - "id": "Aihubmix-MAI-DS-R1", - "name": "Aihubmix-MAI-DS-R1", - "display_name": "Aihubmix-MAI-DS-R1", + "id": "qwen3-next-80b-a3b-instruct", + "name": "qwen3-next-80b-a3b-instruct", + "display_name": "qwen3-next-80b-a3b-instruct", + "modalities": { + "input": [ + "text", + "image" + ] + }, "limit": { - "context": 8192, - "output": 8192 + "context": 256000, + "output": 256000 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "cost": { - "input": 0.6, - "output": 1.8 + "input": 0.138, + "output": 0.552 }, "type": "chat" }, { - "id": "embedding-2", - "name": "embedding-2", - "display_name": "embedding-2", + "id": "qwen3-next-80b-a3b-thinking", + "name": "qwen3-next-80b-a3b-thinking", + "display_name": "qwen3-next-80b-a3b-thinking", "modalities": { "input": [ - "text" + "text", + "image" ] }, "limit": { - "context": 8000, - "output": 8000 + "context": 256000, + "output": 256000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "cost": { - "input": 0.0686, - "output": 0.0686 + "input": 0.138, + "output": 1.38 }, - "type": "embedding" + "type": "chat" }, { - "id": "embedding-3", - "name": "embedding-3", - "display_name": "embedding-3", + "id": "qwen3-235b-a22b-instruct-2507", + "name": "qwen3-235b-a22b-instruct-2507", + "display_name": "qwen3-235b-a22b-instruct-2507", "modalities": { "input": [ - "text" + "text", + "image" ] }, "limit": { - "context": 8000, - "output": 8000 + "context": 262144, + "output": 262144 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "cost": { - "input": 0.0686, - "output": 0.0686 + "input": 0.28, + "output": 1.12 }, - "type": "embedding" + "type": "chat" }, { - "id": "Qwen/Qwen2.5-VL-72B-Instruct", - "name": "Qwen/Qwen2.5-VL-72B-Instruct", - "display_name": "Qwen/Qwen2.5-VL-72B-Instruct", + "id": "qwen3-235b-a22b-thinking-2507", + "name": "qwen3-235b-a22b-thinking-2507", + "display_name": "qwen3-235b-a22b-thinking-2507", "modalities": { "input": [ "text", - "image", - "video" + "image" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 262144, + "output": 262144 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "cost": { - "input": 0.5, - "output": 0.5, - "cache_read": 0 + "input": 0.28, + "output": 2.8 }, "type": "chat" }, { - "id": "o1", - "name": "o1", - "display_name": "o1", + "id": "qwen3-coder-30b-a3b-instruct", + "name": "qwen3-coder-30b-a3b-instruct", + "display_name": "qwen3-coder-30b-a3b-instruct", "modalities": { "input": [ "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 2000000, + "output": 2000000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "cost": { - "input": 15, - "output": 60, - "cache_read": 7.5 + "input": 0.2, + "output": 0.8, + "cache_read": 0.2 }, "type": "chat" }, { - "id": "o1-pro", - "name": "o1-pro", - "display_name": "o1-pro", + "id": "qwen3-coder-480b-a35b-instruct", + "name": "qwen3-coder-480b-a35b-instruct", + "display_name": "qwen3-coder-480b-a35b-instruct", "modalities": { "input": [ "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 262000, + "output": 262000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "cost": { - "input": 170, - "output": 680, - "cache_read": 170 + "input": 0.82, + "output": 3.28, + "cache_read": 0.82 }, "type": "chat" }, { - "id": "ByteDance-Seed/Seed-OSS-36B-Instruct", - "name": "ByteDance-Seed/Seed-OSS-36B-Instruct", - "display_name": "ByteDance-Seed/Seed-OSS-36B-Instruct", + "id": "qwen3-235b-a22b", + "name": "qwen3-235b-a22b", + "display_name": "qwen3-235b-a22b", "modalities": { "input": [ "text", @@ -77450,100 +88476,129 @@ ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 131100, + "output": 131100 }, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "cost": { - "input": 0.2, - "output": 0.534 + "input": 0.28, + "output": 1.12 }, "type": "chat" }, { - "id": "doubao-seed-1-6-250615", - "name": "doubao-seed-1-6-250615", - "display_name": "doubao-seed-1-6-250615", + "id": "qwen3-coder-flash", + "name": "qwen3-coder-flash", + "display_name": "qwen3-coder-flash", + "modalities": { + "input": [ + "text" + ] + }, "limit": { - "context": 8192, - "output": 8192 + "context": 256000, + "output": 256000 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "cost": { - "input": 0.18, - "output": 2.52, - "cache_read": 0.036 + "input": 0.136, + "output": 0.544, + "cache_read": 0.136 }, "type": "chat" }, { - "id": "doubao-seed-1-6-flash-250615", - "name": "doubao-seed-1-6-flash-250615", - "display_name": "doubao-seed-1-6-flash-250615", + "id": "qwen3-coder-plus", + "name": "qwen3-coder-plus", + "display_name": "qwen3-coder-plus", + "modalities": { + "input": [ + "text" + ] + }, "limit": { - "context": 8192, - "output": 8192 + "context": 1048576, + "output": 1048576 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "cost": { - "input": 0.044, - "output": 0.44, - "cache_read": 0.0088 + "input": 0.54, + "output": 2.16, + "cache_read": 0.108 }, "type": "chat" }, { - "id": "doubao-seed-1-6-thinking-250615", - "name": "doubao-seed-1-6-thinking-250615", - "display_name": "doubao-seed-1-6-thinking-250615", + "id": "qwen3-coder-plus-2025-07-22", + "name": "qwen3-coder-plus-2025-07-22", + "display_name": "qwen3-coder-plus-2025-07-22", + "modalities": { + "input": [ + "text" + ] + }, "limit": { - "context": 8192, - "output": 8192 + "context": 128000, + "output": 128000 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "cost": { - "input": 0.18, - "output": 2.52, - "cache_read": 0.036 + "input": 0.54, + "output": 2.16, + "cache_read": 0.54 }, "type": "chat" }, { - "id": "doubao-seed-1-6-vision-250815", - "name": "doubao-seed-1-6-vision-250815", - "display_name": "doubao-seed-1-6-vision-250815", + "id": "gemini-2.5-pro-preview-06-05-search", + "name": "gemini-2.5-pro-preview-06-05-search", + "display_name": "gemini-2.5-pro-preview-06-05-search", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video" + ] + }, "limit": { "context": 8192, "output": 8192 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "cost": { - "input": 0.10959, - "output": 1.0959, - "cache_read": 0.021918 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "Doubao-1.5-thinking-pro", - "name": "Doubao-1.5-thinking-pro", - "display_name": "Doubao-1.5-thinking-pro", + "id": "imagen-4.0-ultra-generate-exp-05-20", + "name": "imagen-4.0-ultra-generate-exp-05-20", + "display_name": "imagen-4.0-ultra-generate-exp-05-20", + "modalities": { + "input": [ + "text", + "image" + ] + }, "limit": { "context": 8192, "output": 8192 @@ -77553,39 +88608,39 @@ "supported": false }, "cost": { - "input": 0.62, - "output": 2.48, - "cache_read": 0.62 + "input": 2, + "output": 2, + "cache_read": 0 }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "cc-minimax-m2", - "name": "cc-minimax-m2", - "display_name": "cc-minimax-m2", + "id": "DeepSeek-V3", + "name": "DeepSeek-V3", + "display_name": "DeepSeek-V3", "modalities": { "input": [ "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 1638000, + "output": 1638000 }, "tool_call": true, "reasoning": { "supported": false }, "cost": { - "input": 0.1, - "output": 0.1 + "input": 0.272, + "output": 1.088 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-Prover-V2-671B", - "name": "deepseek-ai/DeepSeek-Prover-V2-671B", - "display_name": "deepseek-ai/DeepSeek-Prover-V2-671B", + "id": "LongCat-Flash-Chat", + "name": "LongCat-Flash-Chat", + "display_name": "LongCat-Flash-Chat", "limit": { "context": 8192, "output": 8192 @@ -77595,15 +88650,22 @@ "supported": false }, "cost": { - "input": 0.1, - "output": 0.1 + "input": 0.14, + "output": 0.7 }, "type": "chat" }, { - "id": "gemma-3-12b-it", - "name": "gemma-3-12b-it", - "display_name": "gemma-3-12b-it", + "id": "Qwen2.5-VL-72B-Instruct", + "name": "Qwen2.5-VL-72B-Instruct", + "display_name": "Qwen2.5-VL-72B-Instruct", + "modalities": { + "input": [ + "text", + "image", + "video" + ] + }, "limit": { "context": 8192, "output": 8192 @@ -77613,77 +88675,90 @@ "supported": false }, "cost": { - "input": 0.2, - "output": 0.2, - "cache_read": 0 + "input": 0.62, + "output": 0.62 }, "type": "chat" }, { - "id": "gemma-3-27b-it", - "name": "gemma-3-27b-it", - "display_name": "gemma-3-27b-it", + "id": "ernie-5.0-thinking-preview", + "name": "ernie-5.0-thinking-preview", + "display_name": "ernie-5.0-thinking-preview", + "modalities": { + "input": [ + "text" + ] + }, "limit": { - "context": 8192, - "output": 8192 + "context": 183000, + "output": 183000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "cost": { - "input": 0.2, - "output": 0.2, - "cache_read": 0 + "input": 0.822, + "output": 3.288, + "cache_read": 0.822 }, "type": "chat" }, { - "id": "gemma-3-4b-it", - "name": "gemma-3-4b-it", - "display_name": "gemma-3-4b-it", + "id": "inclusionAI/Ling-1T", + "name": "inclusionAI/Ling-1T", + "display_name": "inclusionAI/Ling-1T", + "modalities": { + "input": [ + "text" + ] + }, "limit": { "context": 8192, "output": 8192 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "cost": { - "input": 0.2, - "output": 0.2, - "cache_read": 0 + "input": 0.548, + "output": 2.192 }, "type": "chat" }, { - "id": "gemma-3n-e4b-it", - "name": "gemma-3n-e4b-it", - "display_name": "gemma-3n-e4b-it", + "id": "inclusionAI/Ring-1T", + "name": "inclusionAI/Ring-1T", + "display_name": "inclusionAI/Ring-1T", + "modalities": { + "input": [ + "text" + ] + }, "limit": { "context": 8192, "output": 8192 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "cost": { - "input": 0.2, - "output": 0.2, - "cache_read": 0 + "input": 0.548, + "output": 2.192 }, "type": "chat" }, { - "id": "gpt-4o-image-vip", - "name": "gpt-4o-image-vip", - "display_name": "gpt-4o-image-vip", + "id": "embedding-v1", + "name": "embedding-v1", + "display_name": "embedding-v1", "modalities": { "input": [ - "text", - "image" + "text" ] }, "limit": { @@ -77695,16 +88770,15 @@ "supported": false }, "cost": { - "input": 7, - "output": 7, - "cache_read": 0 + "input": 0.068, + "output": 0.068 }, - "type": "imageGeneration" + "type": "embedding" }, { - "id": "gpt-4o-image", - "name": "gpt-4o-image", - "display_name": "gpt-4o-image", + "id": "ernie-4.5-turbo-latest", + "name": "ernie-4.5-turbo-latest", + "display_name": "ernie-4.5-turbo-latest", "modalities": { "input": [ "text", @@ -77712,43 +88786,48 @@ ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 135000, + "output": 135000 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "cost": { - "input": 3, - "output": 3, - "cache_read": 0 + "input": 0.11, + "output": 0.44 }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "gemma-3-1b-it", - "name": "gemma-3-1b-it", - "display_name": "gemma-3-1b-it", + "id": "ernie-irag-edit", + "name": "ernie-irag-edit", + "display_name": "ernie-irag-edit", + "modalities": { + "input": [ + "text", + "image" + ] + }, "limit": { "context": 8192, "output": 8192 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "cost": { - "input": 0.2, - "output": 0.2, + "input": 2, + "output": 0, "cache_read": 0 }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "deepseek-r1-distill-llama-70b", - "name": "deepseek-r1-distill-llama-70b", - "display_name": "deepseek-r1-distill-llama-70b", + "id": "glm-4.5-x", + "name": "glm-4.5-x", + "display_name": "glm-4.5-x", "modalities": { "input": [ "text" @@ -77760,22 +88839,24 @@ }, "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "cost": { - "input": 0.8, - "output": 1.6 + "input": 2.2, + "output": 8.91, + "cache_read": 0.44 }, "type": "chat" }, { - "id": "gpt-4o-mini-tts", - "name": "gpt-4o-mini-tts", - "display_name": "gpt-4o-mini-tts", + "id": "gme-qwen2-vl-2b-instruct", + "name": "gme-qwen2-vl-2b-instruct", + "display_name": "gme-qwen2-vl-2b-instruct", "modalities": { "input": [ - "audio" + "text", + "image", + "video" ] }, "limit": { @@ -77787,20 +88868,19 @@ "supported": false }, "cost": { - "input": 15, - "output": 15 - } + "input": 0.138, + "output": 0.138 + }, + "type": "embedding" }, { - "id": "gemini-2.0-flash-exp", - "name": "gemini-2.0-flash-exp", - "display_name": "gemini-2.0-flash-exp", + "id": "gte-rerank-v2", + "name": "gte-rerank-v2", + "display_name": "gte-rerank-v2", "modalities": { "input": [ "text", - "image", - "audio", - "video" + "image" ] }, "limit": { @@ -77812,83 +88892,85 @@ "supported": false }, "cost": { - "input": 0.02, - "output": 0.08 + "input": 0.11, + "output": 0.11 }, - "type": "chat" + "type": "rerank" }, { - "id": "tngtech/DeepSeek-R1T-Chimera", - "name": "tngtech/DeepSeek-R1T-Chimera", - "display_name": "tngtech/DeepSeek-R1T-Chimera", + "id": "inclusionAI/Ling-flash-2.0", + "name": "inclusionAI/Ling-flash-2.0", + "display_name": "inclusionAI/Ling-flash-2.0", + "modalities": { + "input": [ + "text" + ] + }, "limit": { "context": 8192, "output": 8192 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "cost": { - "input": 0.02, - "output": 0.02 + "input": 0.136, + "output": 0.544 }, "type": "chat" }, { - "id": "claude-3-5-sonnet", - "name": "claude-3-5-sonnet", - "display_name": "claude-3-5-sonnet", + "id": "inclusionAI/Ling-mini-2.0", + "name": "inclusionAI/Ling-mini-2.0", + "display_name": "inclusionAI/Ling-mini-2.0", "modalities": { "input": [ - "text", - "image" + "text" ] }, "limit": { - "context": 200000, - "output": 200000 + "context": 8192, + "output": 8192 }, "tool_call": true, "reasoning": { "supported": false }, "cost": { - "input": 3.3, - "output": 16.5 + "input": 0.068, + "output": 0.272 }, "type": "chat" }, { - "id": "o1-preview", - "name": "o1-preview", - "display_name": "o1-preview", + "id": "inclusionAI/Ring-flash-2.0", + "name": "inclusionAI/Ring-flash-2.0", + "display_name": "inclusionAI/Ring-flash-2.0", "modalities": { "input": [ - "text", - "image" + "text" ] }, "limit": { "context": 8192, "output": 8192 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, "cost": { - "input": 15, - "output": 60, - "cache_read": 7.5 + "input": 0.136, + "output": 0.544 }, "type": "chat" }, { - "id": "o1-mini", - "name": "o1-mini", - "display_name": "o1-mini", + "id": "irag-1.0", + "name": "irag-1.0", + "display_name": "irag-1.0", "limit": { "context": 8192, "output": 8192 @@ -77898,27 +88980,25 @@ "supported": false }, "cost": { - "input": 3, - "output": 12, - "cache_read": 1.5 + "input": 2, + "output": 0, + "cache_read": 0 }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "gemini-2.0-flash-thinking-exp-01-21", - "name": "gemini-2.0-flash-thinking-exp-01-21", - "display_name": "gemini-2.0-flash-thinking-exp-01-21", + "id": "jina-deepsearch-v1", + "name": "jina-deepsearch-v1", + "display_name": "jina-deepsearch-v1", "modalities": { "input": [ "text", - "image", - "audio", - "video" + "image" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 1000000, + "output": 1000000 }, "tool_call": false, "reasoning": { @@ -77926,15 +89006,15 @@ "default": true }, "cost": { - "input": 0.076, - "output": 0.304 + "input": 0.05, + "output": 0.05 }, "type": "chat" }, { - "id": "gpt-4o-2024-11-20", - "name": "gpt-4o-2024-11-20", - "display_name": "gpt-4o-2024-11-20", + "id": "jina-embeddings-v4", + "name": "jina-embeddings-v4", + "display_name": "jina-embeddings-v4", "modalities": { "input": [ "text", @@ -77942,24 +89022,23 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 8192, + "output": 8192 }, "tool_call": false, "reasoning": { "supported": false }, "cost": { - "input": 2.5, - "output": 10, - "cache_read": 1.25 + "input": 0.05, + "output": 0.05 }, - "type": "chat" + "type": "embedding" }, { - "id": "gpt-4o", - "name": "gpt-4o", - "display_name": "gpt-4o", + "id": "jina-reranker-v3", + "name": "jina-reranker-v3", + "display_name": "jina-reranker-v3", "modalities": { "input": [ "text", @@ -77967,24 +89046,23 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 131000, + "output": 131000 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "cost": { - "input": 2.5, - "output": 10, - "cache_read": 1.25 + "input": 0.05, + "output": 0.05 }, - "type": "chat" + "type": "rerank" }, { - "id": "chatgpt-4o-latest", - "name": "chatgpt-4o-latest", - "display_name": "chatgpt-4o-latest", + "id": "llama-4-maverick", + "name": "llama-4-maverick", + "display_name": "llama-4-maverick", "modalities": { "input": [ "text", @@ -77992,23 +89070,23 @@ ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 1048576, + "output": 1048576 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "cost": { - "input": 5, - "output": 15 + "input": 0.2, + "output": 0.2 }, "type": "chat" }, { - "id": "gpt-4o-mini", - "name": "gpt-4o-mini", - "display_name": "gpt-4o-mini", + "id": "llama-4-scout", + "name": "llama-4-scout", + "display_name": "llama-4-scout", "modalities": { "input": [ "text", @@ -78016,24 +89094,29 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 131000, + "output": 131000 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "cost": { - "input": 0.15, - "output": 0.6, - "cache_read": 0.075 + "input": 0.2, + "output": 0.2 }, "type": "chat" }, { - "id": "AiHubmix-mistral-medium", - "name": "AiHubmix-mistral-medium", - "display_name": "AiHubmix-mistral-medium", + "id": "qwen-image", + "name": "qwen-image", + "display_name": "qwen-image", + "modalities": { + "input": [ + "text", + "image" + ] + }, "limit": { "context": 8192, "output": 8192 @@ -78043,21 +89126,20 @@ "supported": false }, "cost": { - "input": 0.4, - "output": 2 + "input": 2, + "output": 0, + "cache_read": 0 }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "gemini-2.0-pro-exp-02-05", - "name": "gemini-2.0-pro-exp-02-05", - "display_name": "gemini-2.0-pro-exp-02-05", + "id": "qwen-image-edit", + "name": "qwen-image-edit", + "display_name": "qwen-image-edit", "modalities": { "input": [ "text", - "image", - "audio", - "video" + "image" ] }, "limit": { @@ -78069,15 +89151,22 @@ "supported": false }, "cost": { - "input": 1.25, - "output": 5 + "input": 2, + "output": 0, + "cache_read": 0 }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "ernie-x1.1-preview", - "name": "ernie-x1.1-preview", - "display_name": "ernie-x1.1-preview", + "id": "qwen-image-plus", + "name": "qwen-image-plus", + "display_name": "qwen-image-plus", + "modalities": { + "input": [ + "text", + "image" + ] + }, "limit": { "context": 8192, "output": 8192 @@ -78087,80 +89176,113 @@ "supported": false }, "cost": { - "input": 0.136, - "output": 0.544 + "input": 2, + "output": 0, + "cache_read": 0 + }, + "type": "imageGeneration" + }, + { + "id": "qwen-mt-plus", + "name": "qwen-mt-plus", + "display_name": "qwen-mt-plus", + "modalities": { + "input": [ + "text" + ] + }, + "limit": { + "context": 16000, + "output": 16000 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "cost": { + "input": 0.492, + "output": 1.476 }, "type": "chat" }, { - "id": "minimax-m2", - "name": "minimax-m2", - "display_name": "minimax-m2", + "id": "qwen-mt-turbo", + "name": "qwen-mt-turbo", + "display_name": "qwen-mt-turbo", "modalities": { "input": [ "text" ] }, "limit": { - "context": 204800, - "output": 204800 + "context": 16000, + "output": 16000 }, "tool_call": false, "reasoning": { "supported": false }, "cost": { - "input": 0.288, - "output": 1.152 + "input": 0.192, + "output": 0.534912 }, "type": "chat" }, { - "id": "ERNIE-X1.1-Preview", - "name": "ERNIE-X1.1-Preview", - "display_name": "ERNIE-X1.1-Preview", + "id": "qwen3-embedding-0.6b", + "name": "qwen3-embedding-0.6b", + "display_name": "qwen3-embedding-0.6b", "modalities": { "input": [ "text" ] }, "limit": { - "context": 119000, - "output": 119000 + "context": 8192, + "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "cost": { - "input": 0.136, - "output": 0.544 + "input": 0.068, + "output": 0.068 }, - "type": "chat" + "type": "embedding" }, { - "id": "Qwen/QwQ-32B", - "name": "Qwen/QwQ-32B", - "display_name": "Qwen/QwQ-32B", + "id": "qwen3-embedding-4b", + "name": "qwen3-embedding-4b", + "display_name": "qwen3-embedding-4b", + "modalities": { + "input": [ + "text" + ] + }, "limit": { "context": 8192, "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "cost": { - "input": 0.14, - "output": 0.56 + "input": 0.068, + "output": 0.068 }, - "type": "chat" + "type": "embedding" }, { - "id": "chutesai/Mistral-Small-3.1-24B-Instruct-2503", - "name": "chutesai/Mistral-Small-3.1-24B-Instruct-2503", - "display_name": "chutesai/Mistral-Small-3.1-24B-Instruct-2503", + "id": "qwen3-embedding-8b", + "name": "qwen3-embedding-8b", + "display_name": "qwen3-embedding-8b", + "modalities": { + "input": [ + "text" + ] + }, "limit": { "context": 8192, "output": 8192 @@ -78170,58 +89292,63 @@ "supported": false }, "cost": { - "input": 0.2, - "output": 0.8 + "input": 0.068, + "output": 0.068 }, - "type": "chat" + "type": "embedding" }, { - "id": "MiniMaxAI/MiniMax-M1-80k", - "name": "MiniMaxAI/MiniMax-M1-80k", - "display_name": "MiniMaxAI/MiniMax-M1-80k", + "id": "qwen3-reranker-0.6b", + "name": "qwen3-reranker-0.6b", + "display_name": "qwen3-reranker-0.6b", + "modalities": { + "input": [ + "text", + "image" + ] + }, "limit": { - "context": 8192, - "output": 8192 + "context": 16000, + "output": 16000 }, "tool_call": false, "reasoning": { "supported": false }, "cost": { - "input": 0.6, - "output": 2.4 + "input": 0.11, + "output": 0.11 }, - "type": "chat" + "type": "rerank" }, { - "id": "Qwen/Qwen2.5-VL-32B-Instruct", - "name": "Qwen/Qwen2.5-VL-32B-Instruct", - "display_name": "Qwen/Qwen2.5-VL-32B-Instruct", + "id": "qwen3-reranker-4b", + "name": "qwen3-reranker-4b", + "display_name": "qwen3-reranker-4b", "modalities": { "input": [ "text", - "image", - "video" + "image" ] }, "limit": { "context": 8192, "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "cost": { - "input": 0.24, - "output": 0.24 + "input": 0.11, + "output": 0.11 }, - "type": "chat" + "type": "rerank" }, { - "id": "baidu/ERNIE-4.5-300B-A47B", - "name": "baidu/ERNIE-4.5-300B-A47B", - "display_name": "baidu/ERNIE-4.5-300B-A47B", + "id": "qwen3-reranker-8b", + "name": "qwen3-reranker-8b", + "display_name": "qwen3-reranker-8b", "modalities": { "input": [ "text", @@ -78232,32 +89359,25 @@ "context": 8192, "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "cost": { - "input": 0.32, - "output": 1.28, - "cache_read": 0 + "input": 0.11, + "output": 0.11 }, - "type": "chat" + "type": "rerank" }, { - "id": "bge-large-en", - "name": "bge-large-en", - "display_name": "bge-large-en", - "modalities": { - "input": [ - "text", - "image" - ] - }, + "id": "tao-8k", + "name": "tao-8k", + "display_name": "tao-8k", "limit": { "context": 8192, "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, @@ -78268,9 +89388,9 @@ "type": "embedding" }, { - "id": "bge-large-zh", - "name": "bge-large-zh", - "display_name": "bge-large-zh", + "id": "bce-reranker-base", + "name": "bce-reranker-base", + "display_name": "bce-reranker-base", "modalities": { "input": [ "text", @@ -78281,7 +89401,7 @@ "context": 8192, "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, @@ -78289,12 +89409,18 @@ "input": 0.068, "output": 0.068 }, - "type": "embedding" + "type": "rerank" }, { - "id": "codestral-latest", - "name": "codestral-latest", - "display_name": "codestral-latest", + "id": "codex-mini-latest", + "name": "codex-mini-latest", + "display_name": "codex-mini-latest", + "modalities": { + "input": [ + "text", + "image" + ] + }, "limit": { "context": 8192, "output": 8192 @@ -78304,15 +89430,16 @@ "supported": false }, "cost": { - "input": 0.4, - "output": 1.2 + "input": 1.5, + "output": 6, + "cache_read": 0.375 }, "type": "chat" }, { - "id": "ernie-4.5-0.3b", - "name": "ernie-4.5-0.3b", - "display_name": "ernie-4.5-0.3b", + "id": "doubao-seedream-4-0", + "name": "doubao-seedream-4-0", + "display_name": "doubao-seedream-4-0", "modalities": { "input": [ "text", @@ -78323,20 +89450,21 @@ "context": 8192, "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "cost": { - "input": 0.0136, - "output": 0.0544 + "input": 2, + "output": 0, + "cache_read": 0 }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "ernie-4.5-turbo-128k-preview", - "name": "ernie-4.5-turbo-128k-preview", - "display_name": "ernie-4.5-turbo-128k-preview", + "id": "jina-clip-v2", + "name": "jina-clip-v2", + "display_name": "jina-clip-v2", "modalities": { "input": [ "text", @@ -78347,71 +89475,71 @@ "context": 8192, "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "cost": { - "input": 0.108, - "output": 0.432 + "input": 0.05, + "output": 0.05 }, - "type": "chat" + "type": "embedding" }, { - "id": "ernie-x1-turbo", - "name": "ernie-x1-turbo", - "display_name": "ernie-x1-turbo", + "id": "jina-reranker-m0", + "name": "jina-reranker-m0", + "display_name": "jina-reranker-m0", "modalities": { "input": [ - "text" + "text", + "image" ] }, "limit": { - "context": 50500, - "output": 50500 + "context": 8192, + "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "cost": { - "input": 0.136, - "output": 0.544 + "input": 0.05, + "output": 0.05 }, - "type": "chat" + "type": "rerank" }, { - "id": "gemini-2.0-flash-exp-search", - "name": "gemini-2.0-flash-exp-search", - "display_name": "gemini-2.0-flash-exp-search", + "id": "jina-colbert-v2", + "name": "jina-colbert-v2", + "display_name": "jina-colbert-v2", "modalities": { "input": [ - "text", - "image" + "text" ] }, "limit": { "context": 8192, "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "cost": { - "input": 0.1, - "output": 0.4 + "input": 0.05, + "output": 0.05 }, - "type": "chat" + "type": "embedding" }, { - "id": "kat-dev", - "name": "kat-dev", - "display_name": "kat-dev", + "id": "gpt-4o-search-preview", + "name": "gpt-4o-search-preview", + "display_name": "gpt-4o-search-preview", "modalities": { "input": [ - "text" + "text", + "image" ] }, "limit": { @@ -78423,52 +89551,69 @@ "supported": false }, "cost": { - "input": 0.137, - "output": 0.548 + "input": 2.5, + "output": 10, + "cache_read": 1.25 }, "type": "chat" }, { - "id": "llama-3.3-70b", - "name": "llama-3.3-70b", - "display_name": "llama-3.3-70b", + "id": "DeepSeek-R1", + "name": "DeepSeek-R1", + "display_name": "DeepSeek-R1", + "modalities": { + "input": [ + "text" + ] + }, "limit": { - "context": 65536, - "output": 65536 + "context": 1638000, + "output": 1638000 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "cost": { - "input": 0.6, - "output": 0.6 + "input": 0.4, + "output": 2 }, "type": "chat" }, { - "id": "moonshotai/Kimi-Dev-72B", - "name": "moonshotai/Kimi-Dev-72B", - "display_name": "moonshotai/Kimi-Dev-72B", + "id": "gpt-4o-mini-search-preview", + "name": "gpt-4o-mini-search-preview", + "display_name": "gpt-4o-mini-search-preview", + "modalities": { + "input": [ + "text", + "image" + ] + }, "limit": { - "context": 8192, - "output": 8192 + "context": 128000, + "output": 128000 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "cost": { - "input": 0.32, - "output": 1.28, - "cache_read": 0 + "input": 0.15, + "output": 0.6, + "cache_read": 0.075 }, "type": "chat" }, { - "id": "moonshotai/Moonlight-16B-A3B-Instruct", - "name": "moonshotai/Moonlight-16B-A3B-Instruct", - "display_name": "moonshotai/Moonlight-16B-A3B-Instruct", + "id": "jina-embeddings-v3", + "name": "jina-embeddings-v3", + "display_name": "jina-embeddings-v3", + "modalities": { + "input": [ + "text" + ] + }, "limit": { "context": 8192, "output": 8192 @@ -78478,53 +89623,40 @@ "supported": false }, "cost": { - "input": 0.2, - "output": 0.2, + "input": 0.05, + "output": 0.05, "cache_read": 0 }, - "type": "chat" + "type": "embedding" }, { - "id": "o1-global", - "name": "o1-global", - "display_name": "o1-global", - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 15, - "output": 60, - "cache_read": 7.5 + "id": "ernie-4.5", + "name": "ernie-4.5", + "display_name": "ernie-4.5", + "modalities": { + "input": [ + "text", + "image" + ] }, - "type": "chat" - }, - { - "id": "qianfan-qi-vl", - "name": "qianfan-qi-vl", - "display_name": "qianfan-qi-vl", "limit": { - "context": 8192, - "output": 8192 + "context": 160000, + "output": 160000 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "cost": { - "input": 0.2, - "output": 0.6 + "input": 0.068, + "output": 0.272 }, "type": "chat" }, { - "id": "qwen2.5-vl-72b-instruct", - "name": "qwen2.5-vl-72b-instruct", - "display_name": "qwen2.5-vl-72b-instruct", + "id": "ernie-4.5-turbo-vl", + "name": "ernie-4.5-turbo-vl", + "display_name": "ernie-4.5-turbo-vl", "modalities": { "input": [ "text", @@ -78532,41 +89664,56 @@ ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 139000, + "output": 139000 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "cost": { - "input": 2.4, - "output": 7.2 + "input": 0.4, + "output": 1.2 }, "type": "chat" }, { - "id": "tencent/Hunyuan-A13B-Instruct", - "name": "tencent/Hunyuan-A13B-Instruct", - "display_name": "tencent/Hunyuan-A13B-Instruct", + "id": "gemini-2.0-flash", + "name": "gemini-2.0-flash", + "display_name": "gemini-2.0-flash", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video" + ] + }, "limit": { - "context": 8192, - "output": 8192 + "context": 1048576, + "output": 1048576 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "cost": { - "input": 0.14, - "output": 0.56 + "input": 0.1, + "output": 0.4, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "unsloth/gemma-3-27b-it", - "name": "unsloth/gemma-3-27b-it", - "display_name": "unsloth/gemma-3-27b-it", + "id": "gemini-2.0-flash-preview-image-generation", + "name": "gemini-2.0-flash-preview-image-generation", + "display_name": "gemini-2.0-flash-preview-image-generation", + "modalities": { + "input": [ + "text", + "image" + ] + }, "limit": { "context": 8192, "output": 8192 @@ -78576,53 +89723,46 @@ "supported": false }, "cost": { - "input": 0.22, - "output": 0.22, + "input": 0.1, + "output": 0.4, "cache_read": 0 }, "type": "chat" }, { - "id": "qwen-qwq-32b", - "name": "qwen-qwq-32b", - "display_name": "qwen-qwq-32b", - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 0.4, - "output": 0.8 + "id": "mimo-v2-flash-free", + "name": "mimo-v2-flash-free", + "display_name": "mimo-v2-flash-free", + "modalities": { + "input": [ + "text" + ] }, - "type": "chat" - }, - { - "id": "unsloth/gemma-3-12b-it", - "name": "unsloth/gemma-3-12b-it", - "display_name": "unsloth/gemma-3-12b-it", "limit": { - "context": 8192, - "output": 8192 + "context": 256000, + "output": 256000 }, "tool_call": false, "reasoning": { "supported": false }, "cost": { - "input": 0.2, - "output": 0.8, + "input": 0, + "output": 0, "cache_read": 0 }, "type": "chat" }, { - "id": "gemini-exp-1206", - "name": "gemini-exp-1206", - "display_name": "gemini-exp-1206", + "id": "FLUX.1-Kontext-pro", + "name": "FLUX.1-Kontext-pro", + "display_name": "FLUX.1-Kontext-pro", + "modalities": { + "input": [ + "text", + "image" + ] + }, "limit": { "context": 8192, "output": 8192 @@ -78632,15 +89772,15 @@ "supported": false }, "cost": { - "input": 1.25, - "output": 5 + "input": 40, + "output": 40 }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "gpt-4o-zh", - "name": "gpt-4o-zh", - "display_name": "gpt-4o-zh", + "id": "claude-3-7-sonnet", + "name": "claude-3-7-sonnet", + "display_name": "claude-3-7-sonnet", "modalities": { "input": [ "text", @@ -78648,23 +89788,24 @@ ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 200000, + "output": 200000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "cost": { - "input": 2.5, - "output": 10 + "input": 3.3, + "output": 16.5 }, "type": "chat" }, { - "id": "claude-3-5-haiku", - "name": "claude-3-5-haiku", - "display_name": "claude-3-5-haiku", + "id": "FLUX-1.1-pro", + "name": "FLUX-1.1-pro", + "display_name": "FLUX-1.1-pro", "modalities": { "input": [ "text", @@ -78672,131 +89813,158 @@ ] }, "limit": { - "context": 200000, - "output": 200000 + "context": 8192, + "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "cost": { - "input": 1.1, - "output": 5.5 + "input": 40, + "output": 40, + "cache_read": 0 + }, + "type": "imageGeneration" + }, + { + "id": "o3-mini", + "name": "o3-mini", + "display_name": "o3-mini", + "modalities": { + "input": [ + "text", + "image" + ] }, - "type": "chat" - }, - { - "id": "qwen-max-0125", - "name": "qwen-max-0125", - "display_name": "qwen-max-0125", "limit": { - "context": 8192, - "output": 8192 + "context": 200000, + "output": 200000 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "cost": { - "input": 0.38, - "output": 1.52 + "input": 1.1, + "output": 4.4, + "cache_read": 0.55 }, "type": "chat" }, { - "id": "tencent/Hunyuan-MT-7B", - "name": "tencent/Hunyuan-MT-7B", - "display_name": "tencent/Hunyuan-MT-7B", + "id": "doubao-seed-1-6", + "name": "doubao-seed-1-6", + "display_name": "doubao-seed-1-6", + "modalities": { + "input": [ + "text", + "image", + "video" + ] + }, "limit": { - "context": 8192, - "output": 8192 + "context": 256000, + "output": 256000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "cost": { - "input": 0.2, - "output": 0.2 + "input": 0.18, + "output": 1.8, + "cache_read": 0.036 }, "type": "chat" }, { - "id": "BAAI/bge-large-en-v1.5", - "name": "BAAI/bge-large-en-v1.5", - "display_name": "BAAI/bge-large-en-v1.5", + "id": "doubao-seed-1-6-flash", + "name": "doubao-seed-1-6-flash", + "display_name": "doubao-seed-1-6-flash", "modalities": { "input": [ "text", - "image" + "image", + "video" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 256000, + "output": 256000 }, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "cost": { - "input": 0.034, - "output": 0.034 + "input": 0.044, + "output": 0.44, + "cache_read": 0.0088 }, - "type": "embedding" + "type": "chat" }, { - "id": "BAAI/bge-large-zh-v1.5", - "name": "BAAI/bge-large-zh-v1.5", - "display_name": "BAAI/bge-large-zh-v1.5", + "id": "doubao-seed-1-6-lite", + "name": "doubao-seed-1-6-lite", + "display_name": "doubao-seed-1-6-lite", "modalities": { "input": [ "text", - "image" + "image", + "video" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 256000, + "output": 256000 }, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "cost": { - "input": 0.034, - "output": 0.034 + "input": 0.082, + "output": 0.656, + "cache_read": 0.0164 }, - "type": "embedding" + "type": "chat" }, { - "id": "BAAI/bge-reranker-v2-m3", - "name": "BAAI/bge-reranker-v2-m3", - "display_name": "BAAI/bge-reranker-v2-m3", + "id": "doubao-seed-1-6-thinking", + "name": "doubao-seed-1-6-thinking", + "display_name": "doubao-seed-1-6-thinking", "modalities": { "input": [ "text", - "image" + "image", + "video" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 256000, + "output": 256000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "cost": { - "input": 0.034, - "output": 0.034 + "input": 0.18, + "output": 1.8, + "cache_read": 0.036 }, - "type": "rerank" + "type": "chat" }, { - "id": "gemini-2.0-flash-lite-preview-02-05", - "name": "gemini-2.0-flash-lite-preview-02-05", - "display_name": "gemini-2.0-flash-lite-preview-02-05", + "id": "qwen3-30b-a3b-instruct-2507", + "name": "qwen3-30b-a3b-instruct-2507", + "display_name": "qwen3-30b-a3b-instruct-2507", "limit": { "context": 8192, "output": 8192 @@ -78806,22 +89974,15 @@ "supported": false }, "cost": { - "input": 0.075, - "output": 0.3, - "cache_read": 0.075 + "input": 0.1028, + "output": 0.4112 }, "type": "chat" }, { - "id": "V3", - "name": "V3", - "display_name": "V3", - "modalities": { - "input": [ - "text", - "image" - ] - }, + "id": "qwen3-30b-a3b-thinking-2507", + "name": "qwen3-30b-a3b-thinking-2507", + "display_name": "qwen3-30b-a3b-thinking-2507", "limit": { "context": 8192, "output": 8192 @@ -78831,16 +89992,15 @@ "supported": false }, "cost": { - "input": 2, - "output": 2, - "cache_read": 0 + "input": 0.12, + "output": 1.2 }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "sonar-reasoning", - "name": "sonar-reasoning", - "display_name": "sonar-reasoning", + "id": "qwen-3-235b-a22b-thinking-2507", + "name": "qwen-3-235b-a22b-thinking-2507", + "display_name": "qwen-3-235b-a22b-thinking-2507", "limit": { "context": 8192, "output": 8192 @@ -78850,19 +90010,18 @@ "supported": false }, "cost": { - "input": 1.6, - "output": 8 + "input": 0.28, + "output": 2.8 }, "type": "chat" }, { - "id": "V_2", - "name": "V_2", - "display_name": "V_2", + "id": "gemini-embedding-001", + "name": "gemini-embedding-001", + "display_name": "gemini-embedding-001", "modalities": { "input": [ - "text", - "image" + "text" ] }, "limit": { @@ -78874,47 +90033,39 @@ "supported": false }, "cost": { - "input": 2, - "output": 2, - "cache_read": 0 + "input": 0.15, + "output": 0.15 }, - "type": "imageGeneration" + "type": "embedding" }, { - "id": "V_2_TURBO", - "name": "V_2_TURBO", - "display_name": "V_2_TURBO", + "id": "gpt-oss-120b", + "name": "gpt-oss-120b", + "display_name": "gpt-oss-120b", "modalities": { "input": [ - "text", - "image" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 131072, + "output": 131072 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "cost": { - "input": 2, - "output": 2, - "cache_read": 0 + "input": 0.18, + "output": 0.9 }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "V_2A", - "name": "V_2A", - "display_name": "V_2A", - "modalities": { - "input": [ - "text", - "image" - ] - }, + "id": "DeepSeek-R1-Distill-Qwen-32B", + "name": "DeepSeek-R1-Distill-Qwen-32B", + "display_name": "DeepSeek-R1-Distill-Qwen-32B", "limit": { "context": 8192, "output": 8192 @@ -78924,22 +90075,15 @@ "supported": false }, "cost": { - "input": 2, - "output": 2, - "cache_read": 0 + "input": 0.28, + "output": 0.84 }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "V_2A_TURBO", - "name": "V_2A_TURBO", - "display_name": "V_2A_TURBO", - "modalities": { - "input": [ - "text", - "image" - ] - }, + "id": "DeepSeek-R1-Distill-Qwen-7B", + "name": "DeepSeek-R1-Distill-Qwen-7B", + "display_name": "DeepSeek-R1-Distill-Qwen-7B", "limit": { "context": 8192, "output": 8192 @@ -78949,22 +90093,15 @@ "supported": false }, "cost": { - "input": 2, - "output": 2, - "cache_read": 0 + "input": 0.06, + "output": 0.12 }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "V_1", - "name": "V_1", - "display_name": "V_1", - "modalities": { - "input": [ - "text", - "image" - ] - }, + "id": "QwQ-32B", + "name": "QwQ-32B", + "display_name": "QwQ-32B", "limit": { "context": 8192, "output": 8192 @@ -78974,20 +90111,20 @@ "supported": false }, "cost": { - "input": 2, - "output": 2, - "cache_read": 0 + "input": 0.28, + "output": 0.84 }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "V_1_TURBO", - "name": "V_1_TURBO", - "display_name": "V_1_TURBO", + "id": "Qwen2-VL-72B-Instruct", + "name": "Qwen2-VL-72B-Instruct", + "display_name": "Qwen2-VL-72B-Instruct", "modalities": { "input": [ "text", - "image" + "image", + "video" ] }, "limit": { @@ -78999,19 +90136,20 @@ "supported": false }, "cost": { - "input": 2, - "output": 2, - "cache_read": 0 + "input": 2.18, + "output": 6.54 }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "doubao-embedding-large-text-240915", - "name": "doubao-embedding-large-text-240915", - "display_name": "doubao-embedding-large-text-240915", + "id": "Qwen2-VL-7B-Instruct", + "name": "Qwen2-VL-7B-Instruct", + "display_name": "Qwen2-VL-7B-Instruct", "modalities": { "input": [ - "text" + "text", + "image", + "video" ] }, "limit": { @@ -79023,15 +90161,15 @@ "supported": false }, "cost": { - "input": 0.1, - "output": 0.1 + "input": 0.28, + "output": 0.7 }, - "type": "embedding" + "type": "chat" }, { - "id": "kimi-thinking-preview", - "name": "kimi-thinking-preview", - "display_name": "kimi-thinking-preview", + "id": "cc-kimi-for-coding", + "name": "cc-kimi-for-coding", + "display_name": "cc-kimi-for-coding", "limit": { "context": 8192, "output": 8192 @@ -79041,15 +90179,16 @@ "supported": false }, "cost": { - "input": 30, - "output": 30 + "input": 0.2, + "output": 0.2, + "cache_read": 0.02 }, "type": "chat" }, { - "id": "gpt-4o-2024-08-06", - "name": "gpt-4o-2024-08-06", - "display_name": "gpt-4o-2024-08-06", + "id": "Qwen/Qwen3-30B-A3B", + "name": "Qwen/Qwen3-30B-A3B", + "display_name": "Qwen/Qwen3-30B-A3B", "limit": { "context": 8192, "output": 8192 @@ -79059,40 +90198,15 @@ "supported": false }, "cost": { - "input": 2.5, - "output": 10, - "cache_read": 1.25 - }, - "type": "chat" - }, - { - "id": "AiHubmix-Phi-4-reasoning", - "name": "AiHubmix-Phi-4-reasoning", - "display_name": "AiHubmix-Phi-4-reasoning", - "modalities": { - "input": [ - "text" - ] - }, - "limit": { - "context": 128000, - "output": 128000 - }, - "tool_call": false, - "reasoning": { - "supported": true, - "default": true - }, - "cost": { - "input": 0.2, - "output": 0.2 + "input": 1, + "output": 1 }, "type": "chat" }, { - "id": "qwen-plus-2025-07-28", - "name": "qwen-plus-2025-07-28", - "display_name": "qwen-plus-2025-07-28", + "id": "Qwen/Qwen3-32B", + "name": "Qwen/Qwen3-32B", + "display_name": "Qwen/Qwen3-32B", "limit": { "context": 8192, "output": 8192 @@ -79102,16 +90216,15 @@ "supported": false }, "cost": { - "input": 0.11, - "output": 0.275, - "cache_read": 0.11 + "input": 0.4, + "output": 0.8 }, "type": "chat" }, { - "id": "qwen-plus-latest", - "name": "qwen-plus-latest", - "display_name": "qwen-plus-latest", + "id": "Qwen/Qwen3-14B", + "name": "Qwen/Qwen3-14B", + "display_name": "Qwen/Qwen3-14B", "limit": { "context": 8192, "output": 8192 @@ -79121,16 +90234,15 @@ "supported": false }, "cost": { - "input": 0.11, - "output": 0.275, - "cache_read": 0.11 + "input": 0.5, + "output": 0.5 }, "type": "chat" }, { - "id": "sonar", - "name": "sonar", - "display_name": "sonar", + "id": "Qwen/Qwen3-8B", + "name": "Qwen/Qwen3-8B", + "display_name": "Qwen/Qwen3-8B", "limit": { "context": 8192, "output": 8192 @@ -79140,15 +90252,23 @@ "supported": false }, "cost": { - "input": 1.6, - "output": 1.6 + "input": 0.2, + "output": 0.2 }, "type": "chat" }, { - "id": "stepfun-ai/step3", - "name": "stepfun-ai/step3", - "display_name": "stepfun-ai/step3", + "id": "gemini-2.0-pro-exp-02-05-search", + "name": "gemini-2.0-pro-exp-02-05-search", + "display_name": "gemini-2.0-pro-exp-02-05-search", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video" + ] + }, "limit": { "context": 8192, "output": 8192 @@ -79158,105 +90278,116 @@ "supported": false }, "cost": { - "input": 1.1, - "output": 2.75 + "input": 1.25, + "output": 5 }, "type": "chat" }, { - "id": "text-embedding-v4", - "name": "text-embedding-v4", - "display_name": "text-embedding-v4", + "id": "embedding-2", + "name": "embedding-2", + "display_name": "embedding-2", "modalities": { "input": [ "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 8000, + "output": 8000 }, "tool_call": false, "reasoning": { "supported": false }, "cost": { - "input": 0.08, - "output": 0.08 + "input": 0.0686, + "output": 0.0686 }, "type": "embedding" }, { - "id": "qwen-turbo-latest", - "name": "qwen-turbo-latest", - "display_name": "qwen-turbo-latest", + "id": "embedding-3", + "name": "embedding-3", + "display_name": "embedding-3", + "modalities": { + "input": [ + "text" + ] + }, "limit": { - "context": 8192, - "output": 8192 + "context": 8000, + "output": 8000 }, "tool_call": false, "reasoning": { "supported": false }, "cost": { - "input": 0.046, - "output": 0.92, - "cache_read": 0 + "input": 0.0686, + "output": 0.0686 }, - "type": "chat" + "type": "embedding" }, { - "id": "AiHubmix-Phi-4-mini-reasoning", - "name": "AiHubmix-Phi-4-mini-reasoning", - "display_name": "AiHubmix-Phi-4-mini-reasoning", + "id": "gemini-2.0-flash-search", + "name": "gemini-2.0-flash-search", + "display_name": "gemini-2.0-flash-search", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video" ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 8192, + "output": 8192 }, "tool_call": false, "reasoning": { "supported": false }, "cost": { - "input": 0.12, - "output": 0.12 + "input": 0.1, + "output": 0.4, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "aihub-Phi-4-multimodal-instruct", - "name": "aihub-Phi-4-multimodal-instruct", - "display_name": "aihub-Phi-4-multimodal-instruct", + "id": "gemini-2.5-pro-preview-06-05", + "name": "gemini-2.5-pro-preview-06-05", + "display_name": "gemini-2.5-pro-preview-06-05", "modalities": { "input": [ "text", "image", - "audio" + "audio", + "video" ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 1048576, + "output": 1048576 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "cost": { - "input": 0.12, - "output": 0.48 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "qwen3-30b-a3b", - "name": "qwen3-30b-a3b", - "display_name": "qwen3-30b-a3b", + "id": "Aihubmix-MAI-DS-R1", + "name": "Aihubmix-MAI-DS-R1", + "display_name": "Aihubmix-MAI-DS-R1", "limit": { "context": 8192, "output": 8192 @@ -79266,16 +90397,22 @@ "supported": false }, "cost": { - "input": 0.12, - "output": 1.2, - "cache_read": 0 + "input": 0.6, + "output": 1.8 }, "type": "chat" }, { - "id": "qwen3-32b", - "name": "qwen3-32b", - "display_name": "qwen3-32b", + "id": "Qwen/Qwen2.5-VL-72B-Instruct", + "name": "Qwen/Qwen2.5-VL-72B-Instruct", + "display_name": "Qwen/Qwen2.5-VL-72B-Instruct", + "modalities": { + "input": [ + "text", + "image", + "video" + ] + }, "limit": { "context": 8192, "output": 8192 @@ -79285,80 +90422,91 @@ "supported": false }, "cost": { - "input": 0.32, - "output": 3.2, + "input": 0.5, + "output": 0.5, "cache_read": 0 }, "type": "chat" }, { - "id": "grok-3", - "name": "grok-3", - "display_name": "grok-3", + "id": "o1", + "name": "o1", + "display_name": "o1", + "modalities": { + "input": [ + "text" + ] + }, "limit": { "context": 8192, "output": 8192 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "cost": { - "input": 3, - "output": 15 + "input": 15, + "output": 60, + "cache_read": 7.5 }, "type": "chat" }, { - "id": "aihub-Phi-4-mini-instruct", - "name": "aihub-Phi-4-mini-instruct", - "display_name": "aihub-Phi-4-mini-instruct", + "id": "o1-pro", + "name": "o1-pro", + "display_name": "o1-pro", "modalities": { "input": [ "text" ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 8192, + "output": 8192 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "cost": { - "input": 0.12, - "output": 0.48 + "input": 170, + "output": 680, + "cache_read": 170 }, "type": "chat" }, { - "id": "aihub-Phi-4", - "name": "aihub-Phi-4", - "display_name": "aihub-Phi-4", + "id": "ByteDance-Seed/Seed-OSS-36B-Instruct", + "name": "ByteDance-Seed/Seed-OSS-36B-Instruct", + "display_name": "ByteDance-Seed/Seed-OSS-36B-Instruct", "modalities": { "input": [ - "text" + "text", + "image" ] }, "limit": { - "context": 16400, - "output": 16400 + "context": 256000, + "output": 256000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "cost": { - "input": 0.12, - "output": 0.48 + "input": 0.2, + "output": 0.534 }, "type": "chat" }, { - "id": "claude-3-opus-20240229", - "name": "claude-3-opus-20240229", - "display_name": "claude-3-opus-20240229", + "id": "doubao-seed-1-6-250615", + "name": "doubao-seed-1-6-250615", + "display_name": "doubao-seed-1-6-250615", "limit": { "context": 8192, "output": 8192 @@ -79368,21 +90516,16 @@ "supported": false }, "cost": { - "input": 16.5, - "output": 82.5 + "input": 0.18, + "output": 2.52, + "cache_read": 0.036 }, "type": "chat" }, { - "id": "dall-e-3", - "name": "dall-e-3", - "display_name": "dall-e-3", - "modalities": { - "input": [ - "text", - "image" - ] - }, + "id": "doubao-seed-1-6-flash-250615", + "name": "doubao-seed-1-6-flash-250615", + "display_name": "doubao-seed-1-6-flash-250615", "limit": { "context": 8192, "output": 8192 @@ -79392,20 +90535,16 @@ "supported": false }, "cost": { - "input": 40, - "output": 40 + "input": 0.044, + "output": 0.44, + "cache_read": 0.0088 }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "doubao-embedding-text-240715", - "name": "doubao-embedding-text-240715", - "display_name": "doubao-embedding-text-240715", - "modalities": { - "input": [ - "text" - ] - }, + "id": "doubao-seed-1-6-thinking-250615", + "name": "doubao-seed-1-6-thinking-250615", + "display_name": "doubao-seed-1-6-thinking-250615", "limit": { "context": 8192, "output": 8192 @@ -79415,15 +90554,16 @@ "supported": false }, "cost": { - "input": 0.7, - "output": 0.7 + "input": 0.18, + "output": 2.52, + "cache_read": 0.036 }, - "type": "embedding" + "type": "chat" }, { - "id": "qwen3-14b", - "name": "qwen3-14b", - "display_name": "qwen3-14b", + "id": "doubao-seed-1-6-vision-250815", + "name": "doubao-seed-1-6-vision-250815", + "display_name": "doubao-seed-1-6-vision-250815", "limit": { "context": 8192, "output": 8192 @@ -79433,16 +90573,16 @@ "supported": false }, "cost": { - "input": 0.16, - "output": 1.6, - "cache_read": 0 + "input": 0.10959, + "output": 1.0959, + "cache_read": 0.021918 }, "type": "chat" }, { - "id": "grok-3-beta", - "name": "grok-3-beta", - "display_name": "grok-3-beta", + "id": "Doubao-1.5-thinking-pro", + "name": "Doubao-1.5-thinking-pro", + "display_name": "Doubao-1.5-thinking-pro", "limit": { "context": 8192, "output": 8192 @@ -79452,35 +90592,39 @@ "supported": false }, "cost": { - "input": 3, - "output": 15, - "cache_read": 0 + "input": 0.62, + "output": 2.48, + "cache_read": 0.62 }, "type": "chat" }, { - "id": "grok-3-fast", - "name": "grok-3-fast", - "display_name": "grok-3-fast", + "id": "cc-minimax-m2", + "name": "cc-minimax-m2", + "display_name": "cc-minimax-m2", + "modalities": { + "input": [ + "text" + ] + }, "limit": { "context": 8192, "output": 8192 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "cost": { - "input": 5.5, - "output": 27.5, - "cache_read": 0 + "input": 0.1, + "output": 0.1 }, "type": "chat" }, { - "id": "qwen3-8b", - "name": "qwen3-8b", - "display_name": "qwen3-8b", + "id": "deepseek-ai/DeepSeek-Prover-V2-671B", + "name": "deepseek-ai/DeepSeek-Prover-V2-671B", + "display_name": "deepseek-ai/DeepSeek-Prover-V2-671B", "limit": { "context": 8192, "output": 8192 @@ -79490,16 +90634,20 @@ "supported": false }, "cost": { - "input": 0.08, - "output": 0.8, - "cache_read": 0 + "input": 0.1, + "output": 0.1 }, "type": "chat" }, { - "id": "qwen3-4b", - "name": "qwen3-4b", - "display_name": "qwen3-4b", + "id": "gemini-2.5-flash-preview-tts", + "name": "gemini-2.5-flash-preview-tts", + "display_name": "gemini-2.5-flash-preview-tts", + "modalities": { + "input": [ + "text" + ] + }, "limit": { "context": 8192, "output": 8192 @@ -79509,16 +90657,20 @@ "supported": false }, "cost": { - "input": 0.046, - "output": 0.46, + "input": 0.5, + "output": 0.5, "cache_read": 0 - }, - "type": "chat" + } }, { - "id": "deepseek-ai/DeepSeek-R1-Zero", - "name": "deepseek-ai/DeepSeek-R1-Zero", - "display_name": "deepseek-ai/DeepSeek-R1-Zero", + "id": "gemini-2.5-pro-preview-tts", + "name": "gemini-2.5-pro-preview-tts", + "display_name": "gemini-2.5-pro-preview-tts", + "modalities": { + "input": [ + "text" + ] + }, "limit": { "context": 8192, "output": 8192 @@ -79528,15 +90680,15 @@ "supported": false }, "cost": { - "input": 2.2, - "output": 2.2 - }, - "type": "chat" + "input": 1, + "output": 1, + "cache_read": 0 + } }, { - "id": "grok-3-fast-beta", - "name": "grok-3-fast-beta", - "display_name": "grok-3-fast-beta", + "id": "gemma-3-12b-it", + "name": "gemma-3-12b-it", + "display_name": "gemma-3-12b-it", "limit": { "context": 8192, "output": 8192 @@ -79546,16 +90698,16 @@ "supported": false }, "cost": { - "input": 5.5, - "output": 27.5, + "input": 0.2, + "output": 0.2, "cache_read": 0 }, "type": "chat" }, { - "id": "grok-3-mini", - "name": "grok-3-mini", - "display_name": "grok-3-mini", + "id": "gemma-3-27b-it", + "name": "gemma-3-27b-it", + "display_name": "gemma-3-27b-it", "limit": { "context": 8192, "output": 8192 @@ -79565,16 +90717,16 @@ "supported": false }, "cost": { - "input": 0.3, - "output": 0.501, + "input": 0.2, + "output": 0.2, "cache_read": 0 }, "type": "chat" }, { - "id": "grok-3-mini-beta", - "name": "grok-3-mini-beta", - "display_name": "grok-3-mini-beta", + "id": "gemma-3-4b-it", + "name": "gemma-3-4b-it", + "display_name": "gemma-3-4b-it", "limit": { "context": 8192, "output": 8192 @@ -79584,16 +90736,16 @@ "supported": false }, "cost": { - "input": 0.33, - "output": 0.5511, + "input": 0.2, + "output": 0.2, "cache_read": 0 }, "type": "chat" }, { - "id": "qwen3-1.7b", - "name": "qwen3-1.7b", - "display_name": "qwen3-1.7b", + "id": "gemma-3n-e4b-it", + "name": "gemma-3n-e4b-it", + "display_name": "gemma-3n-e4b-it", "limit": { "context": 8192, "output": 8192 @@ -79603,16 +90755,22 @@ "supported": false }, "cost": { - "input": 0.046, - "output": 0.46, + "input": 0.2, + "output": 0.2, "cache_read": 0 }, "type": "chat" }, { - "id": "qwen3-0.6b", - "name": "qwen3-0.6b", - "display_name": "qwen3-0.6b", + "id": "gpt-4o-image-vip", + "name": "gpt-4o-image-vip", + "display_name": "gpt-4o-image-vip", + "modalities": { + "input": [ + "text", + "image" + ] + }, "limit": { "context": 8192, "output": 8192 @@ -79622,16 +90780,22 @@ "supported": false }, "cost": { - "input": 0.046, - "output": 0.46, + "input": 7, + "output": 7, "cache_read": 0 }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "qwen-3-32b", - "name": "qwen-3-32b", - "display_name": "qwen-3-32b", + "id": "gpt-4o-image", + "name": "gpt-4o-image", + "display_name": "gpt-4o-image", + "modalities": { + "input": [ + "text", + "image" + ] + }, "limit": { "context": 8192, "output": 8192 @@ -79641,15 +90805,16 @@ "supported": false }, "cost": { - "input": 0.4, - "output": 1.6 + "input": 3, + "output": 3, + "cache_read": 0 }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "qwen-turbo-2025-04-28", - "name": "qwen-turbo-2025-04-28", - "display_name": "qwen-turbo-2025-04-28", + "id": "gemma-3-1b-it", + "name": "gemma-3-1b-it", + "display_name": "gemma-3-1b-it", "limit": { "context": 8192, "output": 8192 @@ -79659,37 +90824,43 @@ "supported": false }, "cost": { - "input": 0.046, - "output": 0.92, + "input": 0.2, + "output": 0.2, "cache_read": 0 }, "type": "chat" }, { - "id": "grok-3-mini-fast-beta", - "name": "grok-3-mini-fast-beta", - "display_name": "grok-3-mini-fast-beta", + "id": "deepseek-r1-distill-llama-70b", + "name": "deepseek-r1-distill-llama-70b", + "display_name": "deepseek-r1-distill-llama-70b", + "modalities": { + "input": [ + "text" + ] + }, "limit": { "context": 8192, "output": 8192 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "cost": { - "input": 0.33, - "output": 2.20011 + "input": 0.8, + "output": 1.6 }, "type": "chat" }, { - "id": "command-a-03-2025", - "name": "command-a-03-2025", - "display_name": "command-a-03-2025", + "id": "gpt-4o-mini-tts", + "name": "gpt-4o-mini-tts", + "display_name": "gpt-4o-mini-tts", "modalities": { "input": [ - "text" + "audio" ] }, "limit": { @@ -79701,16 +90872,23 @@ "supported": false }, "cost": { - "input": 2.5, - "output": 10, - "cache_read": 0 - }, - "type": "chat" + "input": 0.6, + "output": 12, + "cache_read": 0.6 + } }, { - "id": "qwen-plus-2025-04-28", - "name": "qwen-plus-2025-04-28", - "display_name": "qwen-plus-2025-04-28", + "id": "gemini-2.0-flash-exp", + "name": "gemini-2.0-flash-exp", + "display_name": "gemini-2.0-flash-exp", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video" + ] + }, "limit": { "context": 8192, "output": 8192 @@ -79720,16 +90898,15 @@ "supported": false }, "cost": { - "input": 0.13, - "output": 2.6, - "cache_read": 0 + "input": 0.02, + "output": 0.08 }, "type": "chat" }, { - "id": "THUDM/GLM-Z1-32B-0414", - "name": "THUDM/GLM-Z1-32B-0414", - "display_name": "THUDM/GLM-Z1-32B-0414", + "id": "tngtech/DeepSeek-R1T-Chimera", + "name": "tngtech/DeepSeek-R1T-Chimera", + "display_name": "tngtech/DeepSeek-R1T-Chimera", "limit": { "context": 8192, "output": 8192 @@ -79739,53 +90916,65 @@ "supported": false }, "cost": { - "input": 0.08, - "output": 0.08 + "input": 0.02, + "output": 0.02 }, "type": "chat" }, { - "id": "Pro/THUDM/GLM-4.1V-9B-Thinking", - "name": "Pro/THUDM/GLM-4.1V-9B-Thinking", - "display_name": "Pro/THUDM/GLM-4.1V-9B-Thinking", + "id": "claude-3-5-sonnet", + "name": "claude-3-5-sonnet", + "display_name": "claude-3-5-sonnet", + "modalities": { + "input": [ + "text", + "image" + ] + }, "limit": { - "context": 8192, - "output": 8192 + "context": 200000, + "output": 200000 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "cost": { - "input": 0.04, - "output": 0.16, - "cache_read": 0 + "input": 3.3, + "output": 16.5 }, "type": "chat" }, { - "id": "THUDM/GLM-4.1V-9B-Thinking", - "name": "THUDM/GLM-4.1V-9B-Thinking", - "display_name": "THUDM/GLM-4.1V-9B-Thinking", + "id": "o1-preview", + "name": "o1-preview", + "display_name": "o1-preview", + "modalities": { + "input": [ + "text", + "image" + ] + }, "limit": { "context": 8192, "output": 8192 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "cost": { - "input": 0.1, - "output": 0.1, - "cache_read": 0 + "input": 15, + "output": 60, + "cache_read": 7.5 }, "type": "chat" }, { - "id": "text-embedding-004", - "name": "text-embedding-004", - "display_name": "text-embedding-004", + "id": "o1-mini", + "name": "o1-mini", + "display_name": "o1-mini", "limit": { "context": 8192, "output": 8192 @@ -79795,69 +90984,99 @@ "supported": false }, "cost": { - "input": 0.02, - "output": 0.02 + "input": 3, + "output": 12, + "cache_read": 1.5 }, "type": "chat" }, { - "id": "THUDM/GLM-4-32B-0414", - "name": "THUDM/GLM-4-32B-0414", - "display_name": "THUDM/GLM-4-32B-0414", + "id": "gemini-2.0-flash-thinking-exp-01-21", + "name": "gemini-2.0-flash-thinking-exp-01-21", + "display_name": "gemini-2.0-flash-thinking-exp-01-21", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video" + ] + }, "limit": { "context": 8192, "output": 8192 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "cost": { - "input": 0.08, - "output": 0.08 + "input": 0.076, + "output": 0.304 }, "type": "chat" }, { - "id": "THUDM/GLM-Z1-9B-0414", - "name": "THUDM/GLM-Z1-9B-0414", - "display_name": "THUDM/GLM-Z1-9B-0414", + "id": "gpt-4o-2024-11-20", + "name": "gpt-4o-2024-11-20", + "display_name": "gpt-4o-2024-11-20", + "modalities": { + "input": [ + "text", + "image" + ] + }, "limit": { - "context": 8192, - "output": 8192 + "context": 128000, + "output": 128000 }, "tool_call": false, "reasoning": { "supported": false }, "cost": { - "input": 0.05, - "output": 0.05 + "input": 2.5, + "output": 10, + "cache_read": 1.25 }, "type": "chat" }, { - "id": "THUDM/GLM-4-9B-0414", - "name": "THUDM/GLM-4-9B-0414", - "display_name": "THUDM/GLM-4-9B-0414", + "id": "gpt-4o", + "name": "gpt-4o", + "display_name": "gpt-4o", + "modalities": { + "input": [ + "text", + "image" + ] + }, "limit": { - "context": 8192, - "output": 8192 + "context": 128000, + "output": 128000 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "cost": { - "input": 0.05, - "output": 0.05 + "input": 2.5, + "output": 10, + "cache_read": 1.25 }, "type": "chat" }, { - "id": "cc-doubao-seed-code-preview-latest", - "name": "cc-doubao-seed-code-preview-latest", - "display_name": "cc-doubao-seed-code-preview-latest", + "id": "chatgpt-4o-latest", + "name": "chatgpt-4o-latest", + "display_name": "chatgpt-4o-latest", + "modalities": { + "input": [ + "text", + "image" + ] + }, "limit": { "context": 8192, "output": 8192 @@ -79867,33 +91086,40 @@ "supported": false }, "cost": { - "input": 0.2, - "output": 0.2 + "input": 5, + "output": 15 }, "type": "chat" }, { - "id": "doubao-seed-code-preview-latest", - "name": "doubao-seed-code-preview-latest", - "display_name": "doubao-seed-code-preview-latest", + "id": "gpt-4o-mini", + "name": "gpt-4o-mini", + "display_name": "gpt-4o-mini", + "modalities": { + "input": [ + "text", + "image" + ] + }, "limit": { - "context": 8192, - "output": 8192 + "context": 128000, + "output": 128000 }, "tool_call": false, "reasoning": { "supported": false }, "cost": { - "input": 0.2, - "output": 0.2 + "input": 0.15, + "output": 0.6, + "cache_read": 0.075 }, "type": "chat" }, { - "id": "deepseek-ai/Janus-Pro-7B", - "name": "deepseek-ai/Janus-Pro-7B", - "display_name": "deepseek-ai/Janus-Pro-7B", + "id": "AiHubmix-mistral-medium", + "name": "AiHubmix-mistral-medium", + "display_name": "AiHubmix-mistral-medium", "limit": { "context": 8192, "output": 8192 @@ -79903,15 +91129,23 @@ "supported": false }, "cost": { - "input": 2, + "input": 0.4, "output": 2 }, "type": "chat" }, { - "id": "qwen-3-235b-a22b-instruct-2507", - "name": "qwen-3-235b-a22b-instruct-2507", - "display_name": "qwen-3-235b-a22b-instruct-2507", + "id": "gemini-2.0-pro-exp-02-05", + "name": "gemini-2.0-pro-exp-02-05", + "display_name": "gemini-2.0-pro-exp-02-05", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video" + ] + }, "limit": { "context": 8192, "output": 8192 @@ -79921,15 +91155,15 @@ "supported": false }, "cost": { - "input": 0.28, - "output": 1.4 + "input": 1.25, + "output": 5 }, "type": "chat" }, { - "id": "glm-zero-preview", - "name": "glm-zero-preview", - "display_name": "glm-zero-preview", + "id": "ernie-x1.1-preview", + "name": "ernie-x1.1-preview", + "display_name": "ernie-x1.1-preview", "limit": { "context": 8192, "output": 8192 @@ -79939,74 +91173,80 @@ "supported": false }, "cost": { - "input": 2, - "output": 2 + "input": 0.136, + "output": 0.544 }, "type": "chat" }, { - "id": "gemini-2.0-flash-thinking-exp-1219", - "name": "gemini-2.0-flash-thinking-exp-1219", - "display_name": "gemini-2.0-flash-thinking-exp-1219", + "id": "minimax-m2", + "name": "minimax-m2", + "display_name": "minimax-m2", + "modalities": { + "input": [ + "text" + ] + }, "limit": { - "context": 8192, - "output": 8192 + "context": 204800, + "output": 204800 }, "tool_call": false, "reasoning": { "supported": false }, "cost": { - "input": 0.076, - "output": 0.304 + "input": 0.288, + "output": 1.152 }, "type": "chat" }, { - "id": "glm-4.5-air", - "name": "glm-4.5-air", - "display_name": "glm-4.5-air", + "id": "ERNIE-X1.1-Preview", + "name": "ERNIE-X1.1-Preview", + "display_name": "ERNIE-X1.1-Preview", "modalities": { "input": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 119000, + "output": 119000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "cost": { - "input": 0.14, - "output": 0.84 + "input": 0.136, + "output": 0.544 }, "type": "chat" }, { - "id": "gpt-4-32k", - "name": "gpt-4-32k", - "display_name": "gpt-4-32k", + "id": "Qwen/QwQ-32B", + "name": "Qwen/QwQ-32B", + "display_name": "Qwen/QwQ-32B", "limit": { "context": 8192, "output": 8192 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "cost": { - "input": 60, - "output": 120 + "input": 0.14, + "output": 0.56 }, "type": "chat" }, { - "id": "nvidia-llama-3.1-nemotron-70b-instruct", - "name": "nvidia-llama-3.1-nemotron-70b-instruct", - "display_name": "nvidia-llama-3.1-nemotron-70b-instruct", + "id": "chutesai/Mistral-Small-3.1-24B-Instruct-2503", + "name": "chutesai/Mistral-Small-3.1-24B-Instruct-2503", + "display_name": "chutesai/Mistral-Small-3.1-24B-Instruct-2503", "limit": { "context": 8192, "output": 8192 @@ -80016,15 +91256,15 @@ "supported": false }, "cost": { - "input": 1.32, - "output": 1.32 + "input": 0.2, + "output": 0.8 }, "type": "chat" }, { - "id": "nvidia-llama-3.3-nemotron-super-49b-v1.5", - "name": "nvidia-llama-3.3-nemotron-super-49b-v1.5", - "display_name": "nvidia-llama-3.3-nemotron-super-49b-v1.5", + "id": "MiniMaxAI/MiniMax-M1-80k", + "name": "MiniMaxAI/MiniMax-M1-80k", + "display_name": "MiniMaxAI/MiniMax-M1-80k", "limit": { "context": 8192, "output": 8192 @@ -80034,92 +91274,113 @@ "supported": false }, "cost": { - "input": 0.11, - "output": 0.44 + "input": 0.6, + "output": 2.4 }, "type": "chat" }, { - "id": "nvidia-nemotron-3-nano-30b-a3b", - "name": "nvidia-nemotron-3-nano-30b-a3b", - "display_name": "nvidia-nemotron-3-nano-30b-a3b", + "id": "Qwen/Qwen2.5-VL-32B-Instruct", + "name": "Qwen/Qwen2.5-VL-32B-Instruct", + "display_name": "Qwen/Qwen2.5-VL-32B-Instruct", + "modalities": { + "input": [ + "text", + "image", + "video" + ] + }, "limit": { "context": 8192, "output": 8192 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "cost": { - "input": 0.066, - "output": 0.264 + "input": 0.24, + "output": 0.24 }, "type": "chat" }, { - "id": "nvidia-nemotron-nano-12b-v2-vl", - "name": "nvidia-nemotron-nano-12b-v2-vl", - "display_name": "nvidia-nemotron-nano-12b-v2-vl", + "id": "baidu/ERNIE-4.5-300B-A47B", + "name": "baidu/ERNIE-4.5-300B-A47B", + "display_name": "baidu/ERNIE-4.5-300B-A47B", + "modalities": { + "input": [ + "text", + "image" + ] + }, "limit": { "context": 8192, "output": 8192 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "cost": { - "input": 0.22, - "output": 0.66 + "input": 0.32, + "output": 1.28, + "cache_read": 0 }, "type": "chat" }, { - "id": "nvidia-nemotron-nano-9b-v2", - "name": "nvidia-nemotron-nano-9b-v2", - "display_name": "nvidia-nemotron-nano-9b-v2", + "id": "bge-large-en", + "name": "bge-large-en", + "display_name": "bge-large-en", + "modalities": { + "input": [ + "text", + "image" + ] + }, "limit": { "context": 8192, "output": 8192 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "cost": { - "input": 0.044, - "output": 0.176 + "input": 0.068, + "output": 0.068 }, - "type": "chat" + "type": "embedding" }, { - "id": "coding-glm-4.5-air", - "name": "coding-glm-4.5-air", - "display_name": "coding-glm-4.5-air", + "id": "bge-large-zh", + "name": "bge-large-zh", + "display_name": "bge-large-zh", "modalities": { "input": [ - "text" + "text", + "image" ] }, "limit": { "context": 8192, "output": 8192 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "cost": { - "input": 0.014, - "output": 0.084 + "input": 0.068, + "output": 0.068 }, - "type": "chat" + "type": "embedding" }, { - "id": "o1-preview-2024-09-12", - "name": "o1-preview-2024-09-12", - "display_name": "o1-preview-2024-09-12", + "id": "codestral-latest", + "name": "codestral-latest", + "display_name": "codestral-latest", "limit": { "context": 8192, "output": 8192 @@ -80129,16 +91390,15 @@ "supported": false }, "cost": { - "input": 15, - "output": 60, - "cache_read": 7.5 + "input": 0.4, + "output": 1.2 }, "type": "chat" }, { - "id": "Qwen/QVQ-72B-Preview", - "name": "Qwen/QVQ-72B-Preview", - "display_name": "Qwen/QVQ-72B-Preview", + "id": "moonshotai/Kimi-Dev-72B", + "name": "moonshotai/Kimi-Dev-72B", + "display_name": "moonshotai/Kimi-Dev-72B", "limit": { "context": 8192, "output": 8192 @@ -80148,15 +91408,16 @@ "supported": false }, "cost": { - "input": 1.2, - "output": 1.2 + "input": 0.32, + "output": 1.28, + "cache_read": 0 }, "type": "chat" }, { - "id": "Qwen/QwQ-32B-Preview", - "name": "Qwen/QwQ-32B-Preview", - "display_name": "Qwen/QwQ-32B-Preview", + "id": "moonshotai/Moonlight-16B-A3B-Instruct", + "name": "moonshotai/Moonlight-16B-A3B-Instruct", + "display_name": "moonshotai/Moonlight-16B-A3B-Instruct", "limit": { "context": 8192, "output": 8192 @@ -80166,15 +91427,16 @@ "supported": false }, "cost": { - "input": 0.16, - "output": 0.16 + "input": 0.2, + "output": 0.2, + "cache_read": 0 }, "type": "chat" }, { - "id": "llama-3.1-sonar-huge-128k-online", - "name": "llama-3.1-sonar-huge-128k-online", - "display_name": "llama-3.1-sonar-huge-128k-online", + "id": "o1-global", + "name": "o1-global", + "display_name": "o1-global", "limit": { "context": 8192, "output": 8192 @@ -80184,15 +91446,16 @@ "supported": false }, "cost": { - "input": 5.6, - "output": 5.6 + "input": 15, + "output": 60, + "cache_read": 7.5 }, "type": "chat" }, { - "id": "llama-3.1-sonar-large-128k-online", - "name": "llama-3.1-sonar-large-128k-online", - "display_name": "llama-3.1-sonar-large-128k-online", + "id": "qianfan-qi-vl", + "name": "qianfan-qi-vl", + "display_name": "qianfan-qi-vl", "limit": { "context": 8192, "output": 8192 @@ -80202,15 +91465,21 @@ "supported": false }, "cost": { - "input": 1.2, - "output": 1.2 + "input": 0.2, + "output": 0.6 }, "type": "chat" }, { - "id": "aihubmix-Mistral-Large-2411", - "name": "aihubmix-Mistral-Large-2411", - "display_name": "aihubmix-Mistral-Large-2411", + "id": "qwen2.5-vl-72b-instruct", + "name": "qwen2.5-vl-72b-instruct", + "display_name": "qwen2.5-vl-72b-instruct", + "modalities": { + "input": [ + "text", + "image" + ] + }, "limit": { "context": 8192, "output": 8192 @@ -80220,15 +91489,15 @@ "supported": false }, "cost": { - "input": 2, - "output": 6 + "input": 2.4, + "output": 7.2 }, "type": "chat" }, { - "id": "aihubmix-Mistral-large-2407", - "name": "aihubmix-Mistral-large-2407", - "display_name": "aihubmix-Mistral-large-2407", + "id": "tencent/Hunyuan-A13B-Instruct", + "name": "tencent/Hunyuan-A13B-Instruct", + "display_name": "tencent/Hunyuan-A13B-Instruct", "limit": { "context": 8192, "output": 8192 @@ -80238,15 +91507,15 @@ "supported": false }, "cost": { - "input": 3, - "output": 9 + "input": 0.14, + "output": 0.56 }, "type": "chat" }, { - "id": "grok-2-1212", - "name": "grok-2-1212", - "display_name": "grok-2-1212", + "id": "unsloth/gemma-3-27b-it", + "name": "unsloth/gemma-3-27b-it", + "display_name": "unsloth/gemma-3-27b-it", "limit": { "context": 8192, "output": 8192 @@ -80256,70 +91525,88 @@ "supported": false }, "cost": { - "input": 1.8, - "output": 9 + "input": 0.22, + "output": 0.22, + "cache_read": 0 }, "type": "chat" }, { - "id": "llama-3.1-70b", - "name": "llama-3.1-70b", - "display_name": "llama-3.1-70b", + "id": "ernie-4.5-0.3b", + "name": "ernie-4.5-0.3b", + "display_name": "ernie-4.5-0.3b", + "modalities": { + "input": [ + "text", + "image" + ] + }, "limit": { "context": 8192, "output": 8192 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "cost": { - "input": 0.44, - "output": 0.44 + "input": 0.0136, + "output": 0.0544 }, "type": "chat" }, { - "id": "gemini-2.0-flash-thinking-exp", - "name": "gemini-2.0-flash-thinking-exp", - "display_name": "gemini-2.0-flash-thinking-exp", + "id": "ernie-4.5-turbo-128k-preview", + "name": "ernie-4.5-turbo-128k-preview", + "display_name": "ernie-4.5-turbo-128k-preview", + "modalities": { + "input": [ + "text", + "image" + ] + }, "limit": { "context": 8192, "output": 8192 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "cost": { - "input": 0.076, - "output": 0.304 + "input": 0.108, + "output": 0.432 }, "type": "chat" }, { - "id": "gpt-image-test", - "name": "gpt-image-test", - "display_name": "gpt-image-test", + "id": "ernie-x1-turbo", + "name": "ernie-x1-turbo", + "display_name": "ernie-x1-turbo", + "modalities": { + "input": [ + "text" + ] + }, "limit": { - "context": 8192, - "output": 8192 + "context": 50500, + "output": 50500 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "cost": { - "input": 5, - "output": 40, - "cache_read": 0 + "input": 0.136, + "output": 0.544 }, "type": "chat" }, { - "id": "imagen-3.0-generate-002", - "name": "imagen-3.0-generate-002", - "display_name": "imagen-3.0-generate-002", + "id": "gemini-2.0-flash-exp-search", + "name": "gemini-2.0-flash-exp-search", + "display_name": "gemini-2.0-flash-exp-search", "modalities": { "input": [ "text", @@ -80330,21 +91617,61 @@ "context": 8192, "output": 8192 }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "cost": { + "input": 0.1, + "output": 0.4 + }, + "type": "chat" + }, + { + "id": "kat-dev", + "name": "kat-dev", + "display_name": "kat-dev", + "modalities": { + "input": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 128000 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "cost": { + "input": 0.137, + "output": 0.548 + }, + "type": "chat" + }, + { + "id": "llama-3.3-70b", + "name": "llama-3.3-70b", + "display_name": "llama-3.3-70b", + "limit": { + "context": 65536, + "output": 65536 + }, "tool_call": false, "reasoning": { "supported": false }, "cost": { - "input": 2, - "output": 2, - "cache_read": 0 + "input": 0.6, + "output": 0.6 }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "llama3.1-8b", - "name": "llama3.1-8b", - "display_name": "llama3.1-8b", + "id": "gemini-exp-1206", + "name": "gemini-exp-1206", + "display_name": "gemini-exp-1206", "limit": { "context": 8192, "output": 8192 @@ -80354,15 +91681,15 @@ "supported": false }, "cost": { - "input": 0.3, - "output": 0.6 + "input": 1.25, + "output": 5 }, "type": "chat" }, { - "id": "DESCRIBE", - "name": "DESCRIBE", - "display_name": "DESCRIBE", + "id": "gpt-4o-zh", + "name": "gpt-4o-zh", + "display_name": "gpt-4o-zh", "modalities": { "input": [ "text", @@ -80378,22 +91705,33 @@ "supported": false }, "cost": { - "input": 2, - "output": 2, - "cache_read": 0 + "input": 2.5, + "output": 10 }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "UPSCALE", - "name": "UPSCALE", - "display_name": "UPSCALE", - "modalities": { - "input": [ - "text", - "image" - ] + "id": "qwen-qwq-32b", + "name": "qwen-qwq-32b", + "display_name": "qwen-qwq-32b", + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "cost": { + "input": 0.4, + "output": 0.8 }, + "type": "chat" + }, + { + "id": "unsloth/gemma-3-12b-it", + "name": "unsloth/gemma-3-12b-it", + "display_name": "unsloth/gemma-3-12b-it", "limit": { "context": 8192, "output": 8192 @@ -80403,16 +91741,16 @@ "supported": false }, "cost": { - "input": 2, - "output": 2, + "input": 0.2, + "output": 0.8, "cache_read": 0 }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "bai-qwen3-vl-235b-a22b-instruct", - "name": "bai-qwen3-vl-235b-a22b-instruct", - "display_name": "bai-qwen3-vl-235b-a22b-instruct", + "id": "qwen-max-0125", + "name": "qwen-max-0125", + "display_name": "qwen-max-0125", "limit": { "context": 8192, "output": 8192 @@ -80422,59 +91760,67 @@ "supported": false }, "cost": { - "input": 0.274, - "output": 1.096 + "input": 0.38, + "output": 1.52 }, "type": "chat" }, { - "id": "cc-MiniMax-M2", - "name": "cc-MiniMax-M2", - "display_name": "cc-MiniMax-M2", + "id": "claude-3-5-haiku", + "name": "claude-3-5-haiku", + "display_name": "claude-3-5-haiku", "modalities": { "input": [ - "text" + "text", + "image" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 200000, + "output": 200000 }, "tool_call": true, "reasoning": { "supported": false }, "cost": { - "input": 0.1, - "output": 0.1 + "input": 1.1, + "output": 5.5 }, "type": "chat" }, { - "id": "cc-deepseek-v3", - "name": "cc-deepseek-v3", - "display_name": "cc-deepseek-v3", + "id": "BAAI/bge-large-en-v1.5", + "name": "BAAI/bge-large-en-v1.5", + "display_name": "BAAI/bge-large-en-v1.5", + "modalities": { + "input": [ + "text", + "image" + ] + }, "limit": { "context": 8192, "output": 8192 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "cost": { - "input": 0.3, - "output": 0.3 + "input": 0.034, + "output": 0.034 }, - "type": "chat" + "type": "embedding" }, { - "id": "cc-deepseek-v3.1", - "name": "cc-deepseek-v3.1", - "display_name": "cc-deepseek-v3.1", + "id": "BAAI/bge-large-zh-v1.5", + "name": "BAAI/bge-large-zh-v1.5", + "display_name": "BAAI/bge-large-zh-v1.5", "modalities": { "input": [ - "text" + "text", + "image" ] }, "limit": { @@ -80486,15 +91832,15 @@ "supported": false }, "cost": { - "input": 0.56, - "output": 1.68 + "input": 0.034, + "output": 0.034 }, - "type": "chat" + "type": "embedding" }, { - "id": "cc-ernie-4.5-300b-a47b", - "name": "cc-ernie-4.5-300b-a47b", - "display_name": "cc-ernie-4.5-300b-a47b", + "id": "BAAI/bge-reranker-v2-m3", + "name": "BAAI/bge-reranker-v2-m3", + "display_name": "BAAI/bge-reranker-v2-m3", "modalities": { "input": [ "text", @@ -80505,21 +91851,20 @@ "context": 8192, "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "cost": { - "input": 0.32, - "output": 1.28, - "cache_read": 0 + "input": 0.034, + "output": 0.034 }, - "type": "chat" + "type": "rerank" }, { - "id": "cc-kimi-dev-72b", - "name": "cc-kimi-dev-72b", - "display_name": "cc-kimi-dev-72b", + "id": "tencent/Hunyuan-MT-7B", + "name": "tencent/Hunyuan-MT-7B", + "display_name": "tencent/Hunyuan-MT-7B", "limit": { "context": 8192, "output": 8192 @@ -80529,62 +91874,59 @@ "supported": false }, "cost": { - "input": 0.32, - "output": 1.28, - "cache_read": 0 + "input": 0.2, + "output": 0.2 }, "type": "chat" - }, - { - "id": "cc-kimi-k2-instruct", - "name": "cc-kimi-k2-instruct", - "display_name": "cc-kimi-k2-instruct", - "modalities": { - "input": [ - "text" - ] - }, + }, + { + "id": "gemini-2.0-flash-lite-preview-02-05", + "name": "gemini-2.0-flash-lite-preview-02-05", + "display_name": "gemini-2.0-flash-lite-preview-02-05", "limit": { "context": 8192, "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "cost": { - "input": 1.1, - "output": 3.3 + "input": 0.075, + "output": 0.3, + "cache_read": 0.075 }, "type": "chat" }, { - "id": "cc-kimi-k2-instruct-0905", - "name": "cc-kimi-k2-instruct-0905", - "display_name": "cc-kimi-k2-instruct-0905", + "id": "V3", + "name": "V3", + "display_name": "V3", "modalities": { "input": [ - "text" + "text", + "image" ] }, "limit": { "context": 8192, "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "cost": { - "input": 1.1, - "output": 3.3 + "input": 2, + "output": 2, + "cache_read": 0 }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "cc-kimi-k2-thinking", - "name": "cc-kimi-k2-thinking", - "display_name": "cc-kimi-k2-thinking", + "id": "sonar-reasoning", + "name": "sonar-reasoning", + "display_name": "sonar-reasoning", "limit": { "context": 8192, "output": 8192 @@ -80594,15 +91936,21 @@ "supported": false }, "cost": { - "input": 0.548, - "output": 2.192 + "input": 1.6, + "output": 8 }, "type": "chat" }, { - "id": "computer-use-preview", - "name": "computer-use-preview", - "display_name": "computer-use-preview", + "id": "V_2", + "name": "V_2", + "display_name": "V_2", + "modalities": { + "input": [ + "text", + "image" + ] + }, "limit": { "context": 8192, "output": 8192 @@ -80612,15 +91960,22 @@ "supported": false }, "cost": { - "input": 3, - "output": 12 + "input": 2, + "output": 2, + "cache_read": 0 }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "crush-glm-4.6-free", - "name": "crush-glm-4.6-free", - "display_name": "crush-glm-4.6-free", + "id": "V_2_TURBO", + "name": "V_2_TURBO", + "display_name": "V_2_TURBO", + "modalities": { + "input": [ + "text", + "image" + ] + }, "limit": { "context": 8192, "output": 8192 @@ -80630,15 +91985,16 @@ "supported": false }, "cost": { - "input": 0, - "output": 0 + "input": 2, + "output": 2, + "cache_read": 0 }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "o1-2024-12-17", - "name": "o1-2024-12-17", - "display_name": "o1-2024-12-17", + "id": "V_2A", + "name": "V_2A", + "display_name": "V_2A", "modalities": { "input": [ "text", @@ -80651,20 +92007,25 @@ }, "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "cost": { - "input": 15, - "output": 60, - "cache_read": 7.5 + "input": 2, + "output": 2, + "cache_read": 0 }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "sf-kimi-k2-thinking", - "name": "sf-kimi-k2-thinking", - "display_name": "sf-kimi-k2-thinking", + "id": "V_2A_TURBO", + "name": "V_2A_TURBO", + "display_name": "V_2A_TURBO", + "modalities": { + "input": [ + "text", + "image" + ] + }, "limit": { "context": 8192, "output": 8192 @@ -80674,15 +92035,22 @@ "supported": false }, "cost": { - "input": 0.548, - "output": 2.192 + "input": 2, + "output": 2, + "cache_read": 0 }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "o1-mini-2024-09-12", - "name": "o1-mini-2024-09-12", - "display_name": "o1-mini-2024-09-12", + "id": "V_1", + "name": "V_1", + "display_name": "V_1", + "modalities": { + "input": [ + "text", + "image" + ] + }, "limit": { "context": 8192, "output": 8192 @@ -80692,16 +92060,22 @@ "supported": false }, "cost": { - "input": 3, - "output": 12, - "cache_read": 1.5 + "input": 2, + "output": 2, + "cache_read": 0 }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "omni-moderation-latest", - "name": "omni-moderation-latest", - "display_name": "omni-moderation-latest", + "id": "V_1_TURBO", + "name": "V_1_TURBO", + "display_name": "V_1_TURBO", + "modalities": { + "input": [ + "text", + "image" + ] + }, "limit": { "context": 8192, "output": 8192 @@ -80711,15 +92085,21 @@ "supported": false }, "cost": { - "input": 0.2, - "output": 0.2 + "input": 2, + "output": 2, + "cache_read": 0 }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "qwen-flash", - "name": "qwen-flash", - "display_name": "qwen-flash", + "id": "doubao-embedding-large-text-240915", + "name": "doubao-embedding-large-text-240915", + "display_name": "doubao-embedding-large-text-240915", + "modalities": { + "input": [ + "text" + ] + }, "limit": { "context": 8192, "output": 8192 @@ -80729,16 +92109,15 @@ "supported": false }, "cost": { - "input": 0.02, - "output": 0.2, - "cache_read": 0.02 + "input": 0.1, + "output": 0.1 }, - "type": "chat" + "type": "embedding" }, { - "id": "qwen-flash-2025-07-28", - "name": "qwen-flash-2025-07-28", - "display_name": "qwen-flash-2025-07-28", + "id": "kimi-thinking-preview", + "name": "kimi-thinking-preview", + "display_name": "kimi-thinking-preview", "limit": { "context": 8192, "output": 8192 @@ -80748,16 +92127,15 @@ "supported": false }, "cost": { - "input": 0.02, - "output": 0.2, - "cache_read": 0.02 + "input": 30, + "output": 30 }, "type": "chat" }, { - "id": "qwen-long", - "name": "qwen-long", - "display_name": "qwen-long", + "id": "gpt-4o-2024-08-06", + "name": "gpt-4o-2024-08-06", + "display_name": "gpt-4o-2024-08-06", "limit": { "context": 8192, "output": 8192 @@ -80767,33 +92145,40 @@ "supported": false }, "cost": { - "input": 0.1, - "output": 0.4 + "input": 2.5, + "output": 10, + "cache_read": 1.25 }, "type": "chat" }, { - "id": "qwen-max", - "name": "qwen-max", - "display_name": "qwen-max", + "id": "AiHubmix-Phi-4-reasoning", + "name": "AiHubmix-Phi-4-reasoning", + "display_name": "AiHubmix-Phi-4-reasoning", + "modalities": { + "input": [ + "text" + ] + }, "limit": { - "context": 8192, - "output": 8192 + "context": 128000, + "output": 128000 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "cost": { - "input": 0.38, - "output": 1.52 + "input": 0.2, + "output": 0.2 }, "type": "chat" }, { - "id": "qwen-max-longcontext", - "name": "qwen-max-longcontext", - "display_name": "qwen-max-longcontext", + "id": "qwen-plus-2025-07-28", + "name": "qwen-plus-2025-07-28", + "display_name": "qwen-plus-2025-07-28", "limit": { "context": 8192, "output": 8192 @@ -80803,15 +92188,16 @@ "supported": false }, "cost": { - "input": 7, - "output": 21 + "input": 0.11, + "output": 0.275, + "cache_read": 0.11 }, "type": "chat" }, { - "id": "qwen-plus", - "name": "qwen-plus", - "display_name": "qwen-plus", + "id": "qwen-plus-latest", + "name": "qwen-plus-latest", + "display_name": "qwen-plus-latest", "limit": { "context": 8192, "output": 8192 @@ -80821,20 +92207,16 @@ "supported": false }, "cost": { - "input": 0.7, - "output": 2.1 + "input": 0.11, + "output": 0.275, + "cache_read": 0.11 }, "type": "chat" }, { - "id": "qwen-turbo", - "name": "qwen-turbo", - "display_name": "qwen-turbo", - "modalities": { - "input": [ - "text" - ] - }, + "id": "sonar", + "name": "sonar", + "display_name": "sonar", "limit": { "context": 8192, "output": 8192 @@ -80844,20 +92226,15 @@ "supported": false }, "cost": { - "input": 0.36, - "output": 1.08 + "input": 1.6, + "output": 1.6 }, "type": "chat" }, { - "id": "qwen-turbo-2024-11-01", - "name": "qwen-turbo-2024-11-01", - "display_name": "qwen-turbo-2024-11-01", - "modalities": { - "input": [ - "text" - ] - }, + "id": "stepfun-ai/step3", + "name": "stepfun-ai/step3", + "display_name": "stepfun-ai/step3", "limit": { "context": 8192, "output": 8192 @@ -80867,15 +92244,20 @@ "supported": false }, "cost": { - "input": 0.36, - "output": 1.08 + "input": 1.1, + "output": 2.75 }, "type": "chat" }, { - "id": "qwen2.5-14b-instruct", - "name": "qwen2.5-14b-instruct", - "display_name": "qwen2.5-14b-instruct", + "id": "text-embedding-v4", + "name": "text-embedding-v4", + "display_name": "text-embedding-v4", + "modalities": { + "input": [ + "text" + ] + }, "limit": { "context": 8192, "output": 8192 @@ -80885,15 +92267,15 @@ "supported": false }, "cost": { - "input": 0.4, - "output": 1.2 + "input": 0.08, + "output": 0.08 }, - "type": "chat" + "type": "embedding" }, { - "id": "qwen2.5-32b-instruct", - "name": "qwen2.5-32b-instruct", - "display_name": "qwen2.5-32b-instruct", + "id": "qwen-turbo-latest", + "name": "qwen-turbo-latest", + "display_name": "qwen-turbo-latest", "limit": { "context": 8192, "output": 8192 @@ -80903,51 +92285,64 @@ "supported": false }, "cost": { - "input": 0.6, - "output": 1.2 + "input": 0.046, + "output": 0.92, + "cache_read": 0 }, "type": "chat" }, { - "id": "qwen2.5-3b-instruct", - "name": "qwen2.5-3b-instruct", - "display_name": "qwen2.5-3b-instruct", + "id": "AiHubmix-Phi-4-mini-reasoning", + "name": "AiHubmix-Phi-4-mini-reasoning", + "display_name": "AiHubmix-Phi-4-mini-reasoning", + "modalities": { + "input": [ + "text" + ] + }, "limit": { - "context": 8192, - "output": 8192 + "context": 128000, + "output": 128000 }, "tool_call": false, "reasoning": { "supported": false }, "cost": { - "input": 0.4, - "output": 0.8 + "input": 0.12, + "output": 0.12 }, "type": "chat" }, { - "id": "qwen2.5-72b-instruct", - "name": "qwen2.5-72b-instruct", - "display_name": "qwen2.5-72b-instruct", + "id": "aihub-Phi-4-multimodal-instruct", + "name": "aihub-Phi-4-multimodal-instruct", + "display_name": "aihub-Phi-4-multimodal-instruct", + "modalities": { + "input": [ + "text", + "image", + "audio" + ] + }, "limit": { - "context": 8192, - "output": 8192 + "context": 128000, + "output": 128000 }, "tool_call": false, "reasoning": { "supported": false }, "cost": { - "input": 0.8, - "output": 2.4 + "input": 0.12, + "output": 0.48 }, "type": "chat" }, { - "id": "qwen2.5-7b-instruct", - "name": "qwen2.5-7b-instruct", - "display_name": "qwen2.5-7b-instruct", + "id": "qwen3-30b-a3b", + "name": "qwen3-30b-a3b", + "display_name": "qwen3-30b-a3b", "limit": { "context": 8192, "output": 8192 @@ -80957,15 +92352,16 @@ "supported": false }, "cost": { - "input": 0.4, - "output": 0.8 + "input": 0.12, + "output": 1.2, + "cache_read": 0 }, "type": "chat" }, { - "id": "qwen2.5-coder-1.5b-instruct", - "name": "qwen2.5-coder-1.5b-instruct", - "display_name": "qwen2.5-coder-1.5b-instruct", + "id": "qwen3-32b", + "name": "qwen3-32b", + "display_name": "qwen3-32b", "limit": { "context": 8192, "output": 8192 @@ -80975,15 +92371,16 @@ "supported": false }, "cost": { - "input": 0.2, - "output": 0.4 + "input": 0.32, + "output": 3.2, + "cache_read": 0 }, "type": "chat" }, { - "id": "qwen2.5-coder-7b-instruct", - "name": "qwen2.5-coder-7b-instruct", - "display_name": "qwen2.5-coder-7b-instruct", + "id": "grok-3", + "name": "grok-3", + "display_name": "grok-3", "limit": { "context": 8192, "output": 8192 @@ -80993,51 +92390,61 @@ "supported": false }, "cost": { - "input": 0.2, - "output": 0.4 + "input": 3, + "output": 15 }, "type": "chat" }, { - "id": "qwen2.5-math-1.5b-instruct", - "name": "qwen2.5-math-1.5b-instruct", - "display_name": "qwen2.5-math-1.5b-instruct", + "id": "aihub-Phi-4-mini-instruct", + "name": "aihub-Phi-4-mini-instruct", + "display_name": "aihub-Phi-4-mini-instruct", + "modalities": { + "input": [ + "text" + ] + }, "limit": { - "context": 8192, - "output": 8192 + "context": 128000, + "output": 128000 }, "tool_call": false, "reasoning": { "supported": false }, "cost": { - "input": 0.2, - "output": 0.2 + "input": 0.12, + "output": 0.48 }, "type": "chat" }, { - "id": "qwen2.5-math-72b-instruct", - "name": "qwen2.5-math-72b-instruct", - "display_name": "qwen2.5-math-72b-instruct", + "id": "aihub-Phi-4", + "name": "aihub-Phi-4", + "display_name": "aihub-Phi-4", + "modalities": { + "input": [ + "text" + ] + }, "limit": { - "context": 8192, - "output": 8192 + "context": 16400, + "output": 16400 }, "tool_call": false, "reasoning": { "supported": false }, "cost": { - "input": 0.8, - "output": 2.4 + "input": 0.12, + "output": 0.48 }, "type": "chat" }, { - "id": "qwen2.5-math-7b-instruct", - "name": "qwen2.5-math-7b-instruct", - "display_name": "qwen2.5-math-7b-instruct", + "id": "claude-3-opus-20240229", + "name": "claude-3-opus-20240229", + "display_name": "claude-3-opus-20240229", "limit": { "context": 8192, "output": 8192 @@ -81047,15 +92454,21 @@ "supported": false }, "cost": { - "input": 0.2, - "output": 0.4 + "input": 16.5, + "output": 82.5 }, "type": "chat" }, { - "id": "sonar-reasoning-pro", - "name": "sonar-reasoning-pro", - "display_name": "sonar-reasoning-pro", + "id": "dall-e-3", + "name": "dall-e-3", + "display_name": "dall-e-3", + "modalities": { + "input": [ + "text", + "image" + ] + }, "limit": { "context": 8192, "output": 8192 @@ -81065,15 +92478,20 @@ "supported": false }, "cost": { - "input": 3, - "output": 12 + "input": 40, + "output": 40 }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "sophnet-glm-4.7", - "name": "sophnet-glm-4.7", - "display_name": "sophnet-glm-4.7", + "id": "doubao-embedding-text-240715", + "name": "doubao-embedding-text-240715", + "display_name": "doubao-embedding-text-240715", + "modalities": { + "input": [ + "text" + ] + }, "limit": { "context": 8192, "output": 8192 @@ -81083,16 +92501,15 @@ "supported": false }, "cost": { - "input": 0.273974, - "output": 1.095896, - "cache_read": 0.273974 + "input": 0.7, + "output": 0.7 }, - "type": "chat" + "type": "embedding" }, { - "id": "sophnet-minimax-m2.1", - "name": "sophnet-minimax-m2.1", - "display_name": "sophnet-minimax-m2.1", + "id": "qwen3-14b", + "name": "qwen3-14b", + "display_name": "qwen3-14b", "limit": { "context": 8192, "output": 8192 @@ -81102,15 +92519,16 @@ "supported": false }, "cost": { - "input": 0.2876, - "output": 1.1504 + "input": 0.16, + "output": 1.6, + "cache_read": 0 }, "type": "chat" }, { - "id": "step-2-16k", - "name": "step-2-16k", - "display_name": "step-2-16k", + "id": "grok-3-beta", + "name": "grok-3-beta", + "display_name": "grok-3-beta", "limit": { "context": 8192, "output": 8192 @@ -81120,15 +92538,16 @@ "supported": false }, "cost": { - "input": 2, - "output": 2 + "input": 3, + "output": 15, + "cache_read": 0 }, "type": "chat" }, { - "id": "text-ada-001", - "name": "text-ada-001", - "display_name": "text-ada-001", + "id": "grok-3-fast", + "name": "grok-3-fast", + "display_name": "grok-3-fast", "limit": { "context": 8192, "output": 8192 @@ -81138,15 +92557,16 @@ "supported": false }, "cost": { - "input": 0.4, - "output": 0.4 + "input": 5.5, + "output": 27.5, + "cache_read": 0 }, "type": "chat" }, { - "id": "text-babbage-001", - "name": "text-babbage-001", - "display_name": "text-babbage-001", + "id": "qwen3-8b", + "name": "qwen3-8b", + "display_name": "qwen3-8b", "limit": { "context": 8192, "output": 8192 @@ -81156,15 +92576,16 @@ "supported": false }, "cost": { - "input": 0.5, - "output": 0.5 + "input": 0.08, + "output": 0.8, + "cache_read": 0 }, "type": "chat" }, { - "id": "text-curie-001", - "name": "text-curie-001", - "display_name": "text-curie-001", + "id": "qwen3-4b", + "name": "qwen3-4b", + "display_name": "qwen3-4b", "limit": { "context": 8192, "output": 8192 @@ -81174,15 +92595,16 @@ "supported": false }, "cost": { - "input": 2, - "output": 2 + "input": 0.046, + "output": 0.46, + "cache_read": 0 }, "type": "chat" }, { - "id": "text-davinci-002", - "name": "text-davinci-002", - "display_name": "text-davinci-002", + "id": "deepseek-ai/DeepSeek-R1-Zero", + "name": "deepseek-ai/DeepSeek-R1-Zero", + "display_name": "deepseek-ai/DeepSeek-R1-Zero", "limit": { "context": 8192, "output": 8192 @@ -81192,15 +92614,15 @@ "supported": false }, "cost": { - "input": 20, - "output": 20 + "input": 2.2, + "output": 2.2 }, "type": "chat" }, { - "id": "text-davinci-003", - "name": "text-davinci-003", - "display_name": "text-davinci-003", + "id": "grok-3-fast-beta", + "name": "grok-3-fast-beta", + "display_name": "grok-3-fast-beta", "limit": { "context": 8192, "output": 8192 @@ -81210,15 +92632,16 @@ "supported": false }, "cost": { - "input": 20, - "output": 20 + "input": 5.5, + "output": 27.5, + "cache_read": 0 }, "type": "chat" }, { - "id": "text-davinci-edit-001", - "name": "text-davinci-edit-001", - "display_name": "text-davinci-edit-001", + "id": "grok-3-mini", + "name": "grok-3-mini", + "display_name": "grok-3-mini", "limit": { "context": 8192, "output": 8192 @@ -81228,20 +92651,16 @@ "supported": false }, "cost": { - "input": 20, - "output": 20 + "input": 0.3, + "output": 0.501, + "cache_read": 0 }, "type": "chat" }, { - "id": "text-embedding-3-large", - "name": "text-embedding-3-large", - "display_name": "text-embedding-3-large", - "modalities": { - "input": [ - "text" - ] - }, + "id": "grok-3-mini-beta", + "name": "grok-3-mini-beta", + "display_name": "grok-3-mini-beta", "limit": { "context": 8192, "output": 8192 @@ -81251,20 +92670,16 @@ "supported": false }, "cost": { - "input": 0.13, - "output": 0.13 + "input": 0.33, + "output": 0.5511, + "cache_read": 0 }, - "type": "embedding" + "type": "chat" }, { - "id": "text-embedding-3-small", - "name": "text-embedding-3-small", - "display_name": "text-embedding-3-small", - "modalities": { - "input": [ - "text" - ] - }, + "id": "qwen3-1.7b", + "name": "qwen3-1.7b", + "display_name": "qwen3-1.7b", "limit": { "context": 8192, "output": 8192 @@ -81274,20 +92689,16 @@ "supported": false }, "cost": { - "input": 0.02, - "output": 0.02 + "input": 0.046, + "output": 0.46, + "cache_read": 0 }, - "type": "embedding" + "type": "chat" }, { - "id": "text-embedding-ada-002", - "name": "text-embedding-ada-002", - "display_name": "text-embedding-ada-002", - "modalities": { - "input": [ - "text" - ] - }, + "id": "qwen3-0.6b", + "name": "qwen3-0.6b", + "display_name": "qwen3-0.6b", "limit": { "context": 8192, "output": 8192 @@ -81297,20 +92708,16 @@ "supported": false }, "cost": { - "input": 0.1, - "output": 0.1 + "input": 0.046, + "output": 0.46, + "cache_read": 0 }, - "type": "embedding" + "type": "chat" }, { - "id": "text-embedding-v1", - "name": "text-embedding-v1", - "display_name": "text-embedding-v1", - "modalities": { - "input": [ - "text" - ] - }, + "id": "qwen-3-32b", + "name": "qwen-3-32b", + "display_name": "qwen-3-32b", "limit": { "context": 8192, "output": 8192 @@ -81320,15 +92727,15 @@ "supported": false }, "cost": { - "input": 0.1, - "output": 0.1 + "input": 0.4, + "output": 1.6 }, - "type": "embedding" + "type": "chat" }, { - "id": "text-moderation-007", - "name": "text-moderation-007", - "display_name": "text-moderation-007", + "id": "qwen-turbo-2025-04-28", + "name": "qwen-turbo-2025-04-28", + "display_name": "qwen-turbo-2025-04-28", "limit": { "context": 8192, "output": 8192 @@ -81338,15 +92745,16 @@ "supported": false }, "cost": { - "input": 0.2, - "output": 0.2 + "input": 0.046, + "output": 0.92, + "cache_read": 0 }, "type": "chat" }, { - "id": "text-moderation-latest", - "name": "text-moderation-latest", - "display_name": "text-moderation-latest", + "id": "grok-3-mini-fast-beta", + "name": "grok-3-mini-fast-beta", + "display_name": "grok-3-mini-fast-beta", "limit": { "context": 8192, "output": 8192 @@ -81356,15 +92764,20 @@ "supported": false }, "cost": { - "input": 0.2, - "output": 0.2 + "input": 0.33, + "output": 2.20011 }, "type": "chat" }, { - "id": "text-moderation-stable", - "name": "text-moderation-stable", - "display_name": "text-moderation-stable", + "id": "command-a-03-2025", + "name": "command-a-03-2025", + "display_name": "command-a-03-2025", + "modalities": { + "input": [ + "text" + ] + }, "limit": { "context": 8192, "output": 8192 @@ -81374,15 +92787,16 @@ "supported": false }, "cost": { - "input": 0.2, - "output": 0.2 + "input": 2.5, + "output": 10, + "cache_read": 0 }, "type": "chat" }, { - "id": "text-search-ada-doc-001", - "name": "text-search-ada-doc-001", - "display_name": "text-search-ada-doc-001", + "id": "qwen-plus-2025-04-28", + "name": "qwen-plus-2025-04-28", + "display_name": "qwen-plus-2025-04-28", "limit": { "context": 8192, "output": 8192 @@ -81392,20 +92806,16 @@ "supported": false }, "cost": { - "input": 20, - "output": 20 + "input": 0.13, + "output": 2.6, + "cache_read": 0 }, "type": "chat" }, { - "id": "tts-1", - "name": "tts-1", - "display_name": "tts-1", - "modalities": { - "input": [ - "audio" - ] - }, + "id": "THUDM/GLM-Z1-32B-0414", + "name": "THUDM/GLM-Z1-32B-0414", + "display_name": "THUDM/GLM-Z1-32B-0414", "limit": { "context": 8192, "output": 8192 @@ -81415,19 +92825,15 @@ "supported": false }, "cost": { - "input": 15, - "output": 15 - } + "input": 0.08, + "output": 0.08 + }, + "type": "chat" }, { - "id": "tts-1-1106", - "name": "tts-1-1106", - "display_name": "tts-1-1106", - "modalities": { - "input": [ - "audio" - ] - }, + "id": "Pro/THUDM/GLM-4.1V-9B-Thinking", + "name": "Pro/THUDM/GLM-4.1V-9B-Thinking", + "display_name": "Pro/THUDM/GLM-4.1V-9B-Thinking", "limit": { "context": 8192, "output": 8192 @@ -81437,19 +92843,16 @@ "supported": false }, "cost": { - "input": 15, - "output": 15 - } + "input": 0.04, + "output": 0.16, + "cache_read": 0 + }, + "type": "chat" }, { - "id": "tts-1-hd", - "name": "tts-1-hd", - "display_name": "tts-1-hd", - "modalities": { - "input": [ - "audio" - ] - }, + "id": "THUDM/GLM-4.1V-9B-Thinking", + "name": "THUDM/GLM-4.1V-9B-Thinking", + "display_name": "THUDM/GLM-4.1V-9B-Thinking", "limit": { "context": 8192, "output": 8192 @@ -81459,19 +92862,16 @@ "supported": false }, "cost": { - "input": 30, - "output": 30 - } + "input": 0.1, + "output": 0.1, + "cache_read": 0 + }, + "type": "chat" }, { - "id": "tts-1-hd-1106", - "name": "tts-1-hd-1106", - "display_name": "tts-1-hd-1106", - "modalities": { - "input": [ - "audio" - ] - }, + "id": "text-embedding-004", + "name": "text-embedding-004", + "display_name": "text-embedding-004", "limit": { "context": 8192, "output": 8192 @@ -81481,22 +92881,15 @@ "supported": false }, "cost": { - "input": 30, - "output": 30 - } + "input": 0.02, + "output": 0.02 + }, + "type": "chat" }, { - "id": "veo-3", - "name": "veo-3", - "display_name": "veo-3", - "modalities": { - "input": [ - "text", - "image", - "audio", - "video" - ] - }, + "id": "THUDM/GLM-4-32B-0414", + "name": "THUDM/GLM-4-32B-0414", + "display_name": "THUDM/GLM-4-32B-0414", "limit": { "context": 8192, "output": 8192 @@ -81506,24 +92899,15 @@ "supported": false }, "cost": { - "input": 2, - "output": 2, - "cache_read": 0 + "input": 0.08, + "output": 0.08 }, "type": "chat" }, { - "id": "veo3", - "name": "veo3", - "display_name": "veo3", - "modalities": { - "input": [ - "text", - "image", - "audio", - "video" - ] - }, + "id": "THUDM/GLM-Z1-9B-0414", + "name": "THUDM/GLM-Z1-9B-0414", + "display_name": "THUDM/GLM-Z1-9B-0414", "limit": { "context": 8192, "output": 8192 @@ -81533,21 +92917,15 @@ "supported": false }, "cost": { - "input": 2, - "output": 2, - "cache_read": 0 + "input": 0.05, + "output": 0.05 }, "type": "chat" }, { - "id": "whisper-1", - "name": "whisper-1", - "display_name": "whisper-1", - "modalities": { - "input": [ - "audio" - ] - }, + "id": "THUDM/GLM-4-9B-0414", + "name": "THUDM/GLM-4-9B-0414", + "display_name": "THUDM/GLM-4-9B-0414", "limit": { "context": 8192, "output": 8192 @@ -81557,20 +92935,15 @@ "supported": false }, "cost": { - "input": 100, - "output": 100 + "input": 0.05, + "output": 0.05 }, "type": "chat" }, { - "id": "whisper-large-v3", - "name": "whisper-large-v3", - "display_name": "whisper-large-v3", - "modalities": { - "input": [ - "audio" - ] - }, + "id": "cc-doubao-seed-code-preview-latest", + "name": "cc-doubao-seed-code-preview-latest", + "display_name": "cc-doubao-seed-code-preview-latest", "limit": { "context": 8192, "output": 8192 @@ -81580,20 +92953,15 @@ "supported": false }, "cost": { - "input": 30.834, - "output": 30.834 + "input": 0.2, + "output": 0.2 }, "type": "chat" }, { - "id": "whisper-large-v3-turbo", - "name": "whisper-large-v3-turbo", - "display_name": "whisper-large-v3-turbo", - "modalities": { - "input": [ - "audio" - ] - }, + "id": "doubao-seed-code-preview-latest", + "name": "doubao-seed-code-preview-latest", + "display_name": "doubao-seed-code-preview-latest", "limit": { "context": 8192, "output": 8192 @@ -81603,15 +92971,15 @@ "supported": false }, "cost": { - "input": 5.556, - "output": 5.556 + "input": 0.2, + "output": 0.2 }, "type": "chat" }, { - "id": "yi-large", - "name": "yi-large", - "display_name": "yi-large", + "id": "deepseek-ai/Janus-Pro-7B", + "name": "deepseek-ai/Janus-Pro-7B", + "display_name": "deepseek-ai/Janus-Pro-7B", "limit": { "context": 8192, "output": 8192 @@ -81621,15 +92989,15 @@ "supported": false }, "cost": { - "input": 3, - "output": 3 + "input": 2, + "output": 2 }, "type": "chat" }, { - "id": "yi-large-rag", - "name": "yi-large-rag", - "display_name": "yi-large-rag", + "id": "qwen-3-235b-a22b-instruct-2507", + "name": "qwen-3-235b-a22b-instruct-2507", + "display_name": "qwen-3-235b-a22b-instruct-2507", "limit": { "context": 8192, "output": 8192 @@ -81639,15 +93007,15 @@ "supported": false }, "cost": { - "input": 4, - "output": 4 + "input": 0.28, + "output": 1.4 }, "type": "chat" }, { - "id": "yi-large-turbo", - "name": "yi-large-turbo", - "display_name": "yi-large-turbo", + "id": "glm-zero-preview", + "name": "glm-zero-preview", + "display_name": "glm-zero-preview", "limit": { "context": 8192, "output": 8192 @@ -81657,15 +93025,15 @@ "supported": false }, "cost": { - "input": 1.8, - "output": 1.8 + "input": 2, + "output": 2 }, "type": "chat" }, { - "id": "yi-lightning", - "name": "yi-lightning", - "display_name": "yi-lightning", + "id": "gemini-2.0-flash-thinking-exp-1219", + "name": "gemini-2.0-flash-thinking-exp-1219", + "display_name": "gemini-2.0-flash-thinking-exp-1219", "limit": { "context": 8192, "output": 8192 @@ -81675,33 +93043,38 @@ "supported": false }, "cost": { - "input": 0.2, - "output": 0.2 + "input": 0.076, + "output": 0.304 }, "type": "chat" }, { - "id": "yi-medium", - "name": "yi-medium", - "display_name": "yi-medium", + "id": "glm-4.5-air", + "name": "glm-4.5-air", + "display_name": "glm-4.5-air", + "modalities": { + "input": [ + "text" + ] + }, "limit": { - "context": 8192, - "output": 8192 + "context": 131072, + "output": 131072 }, "tool_call": false, "reasoning": { "supported": false }, "cost": { - "input": 0.4, - "output": 0.4 + "input": 0.14, + "output": 0.84 }, "type": "chat" }, { - "id": "yi-vl-plus", - "name": "yi-vl-plus", - "display_name": "yi-vl-plus", + "id": "gpt-4-32k", + "name": "gpt-4-32k", + "display_name": "gpt-4-32k", "limit": { "context": 8192, "output": 8192 @@ -81711,15 +93084,20 @@ "supported": false }, "cost": { - "input": 0.000852, - "output": 0.000852 + "input": 60, + "output": 120 }, "type": "chat" }, { - "id": "fx-flux-2-pro", - "name": "fx-flux-2-pro", - "display_name": "fx-flux-2-pro", + "id": "coding-glm-4.5-air", + "name": "coding-glm-4.5-air", + "display_name": "coding-glm-4.5-air", + "modalities": { + "input": [ + "text" + ] + }, "limit": { "context": 8192, "output": 8192 @@ -81729,16 +93107,15 @@ "supported": false }, "cost": { - "input": 2, - "output": 0, - "cache_read": 0 + "input": 0.014, + "output": 0.084 }, "type": "chat" }, { - "id": "gemini-2.0-flash-001", - "name": "gemini-2.0-flash-001", - "display_name": "gemini-2.0-flash-001", + "id": "nvidia-llama-3.1-nemotron-70b-instruct", + "name": "nvidia-llama-3.1-nemotron-70b-instruct", + "display_name": "nvidia-llama-3.1-nemotron-70b-instruct", "limit": { "context": 8192, "output": 8192 @@ -81748,16 +93125,15 @@ "supported": false }, "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.25 + "input": 1.32, + "output": 1.32 }, "type": "chat" }, { - "id": "gemini-2.0-flash-exp-image-generation", - "name": "gemini-2.0-flash-exp-image-generation", - "display_name": "gemini-2.0-flash-exp-image-generation", + "id": "nvidia-llama-3.3-nemotron-super-49b-v1.5", + "name": "nvidia-llama-3.3-nemotron-super-49b-v1.5", + "display_name": "nvidia-llama-3.3-nemotron-super-49b-v1.5", "limit": { "context": 8192, "output": 8192 @@ -81767,23 +93143,15 @@ "supported": false }, "cost": { - "input": 0.1, - "output": 0.4 + "input": 0.11, + "output": 0.44 }, "type": "chat" }, { - "id": "gemini-2.0-flash-lite", - "name": "gemini-2.0-flash-lite", - "display_name": "gemini-2.0-flash-lite", - "modalities": { - "input": [ - "text", - "image", - "audio", - "video" - ] - }, + "id": "nvidia-nemotron-3-nano-30b-a3b", + "name": "nvidia-nemotron-3-nano-30b-a3b", + "display_name": "nvidia-nemotron-3-nano-30b-a3b", "limit": { "context": 8192, "output": 8192 @@ -81793,16 +93161,15 @@ "supported": false }, "cost": { - "input": 0.076, - "output": 0.304, - "cache_read": 0.076 + "input": 0.066, + "output": 0.264 }, "type": "chat" }, { - "id": "gemini-2.0-flash-lite-001", - "name": "gemini-2.0-flash-lite-001", - "display_name": "gemini-2.0-flash-lite-001", + "id": "nvidia-nemotron-nano-12b-v2-vl", + "name": "nvidia-nemotron-nano-12b-v2-vl", + "display_name": "nvidia-nemotron-nano-12b-v2-vl", "limit": { "context": 8192, "output": 8192 @@ -81812,48 +93179,33 @@ "supported": false }, "cost": { - "input": 0.076, - "output": 0.304, - "cache_read": 0.076 + "input": 0.22, + "output": 0.66 }, "type": "chat" }, { - "id": "gemini-2.5-pro-exp-03-25", - "name": "gemini-2.5-pro-exp-03-25", - "display_name": "gemini-2.5-pro-exp-03-25", - "modalities": { - "input": [ - "text", - "image", - "audio", - "video" - ] - }, + "id": "nvidia-nemotron-nano-9b-v2", + "name": "nvidia-nemotron-nano-9b-v2", + "display_name": "nvidia-nemotron-nano-9b-v2", "limit": { "context": 8192, "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "cost": { - "input": 1.25, - "output": 5, - "cache_read": 0.125 + "input": 0.044, + "output": 0.176 }, "type": "chat" }, { - "id": "gemini-embedding-exp-03-07", - "name": "gemini-embedding-exp-03-07", - "display_name": "gemini-embedding-exp-03-07", - "modalities": { - "input": [ - "text" - ] - }, + "id": "o1-preview-2024-09-12", + "name": "o1-preview-2024-09-12", + "display_name": "o1-preview-2024-09-12", "limit": { "context": 8192, "output": 8192 @@ -81863,15 +93215,16 @@ "supported": false }, "cost": { - "input": 0.02, - "output": 0.02 + "input": 15, + "output": 60, + "cache_read": 7.5 }, - "type": "embedding" + "type": "chat" }, { - "id": "gemini-exp-1114", - "name": "gemini-exp-1114", - "display_name": "gemini-exp-1114", + "id": "Qwen/QVQ-72B-Preview", + "name": "Qwen/QVQ-72B-Preview", + "display_name": "Qwen/QVQ-72B-Preview", "limit": { "context": 8192, "output": 8192 @@ -81881,15 +93234,15 @@ "supported": false }, "cost": { - "input": 1.25, - "output": 5 + "input": 1.2, + "output": 1.2 }, "type": "chat" }, { - "id": "gemini-exp-1121", - "name": "gemini-exp-1121", - "display_name": "gemini-exp-1121", + "id": "Qwen/QwQ-32B-Preview", + "name": "Qwen/QwQ-32B-Preview", + "display_name": "Qwen/QwQ-32B-Preview", "limit": { "context": 8192, "output": 8192 @@ -81899,15 +93252,15 @@ "supported": false }, "cost": { - "input": 1.25, - "output": 5 + "input": 0.16, + "output": 0.16 }, "type": "chat" }, { - "id": "gemini-pro", - "name": "gemini-pro", - "display_name": "gemini-pro", + "id": "llama-3.1-sonar-huge-128k-online", + "name": "llama-3.1-sonar-huge-128k-online", + "display_name": "llama-3.1-sonar-huge-128k-online", "limit": { "context": 8192, "output": 8192 @@ -81917,15 +93270,15 @@ "supported": false }, "cost": { - "input": 0.2, - "output": 0.6 + "input": 5.6, + "output": 5.6 }, "type": "chat" - }, - { - "id": "gemini-pro-vision", - "name": "gemini-pro-vision", - "display_name": "gemini-pro-vision", + }, + { + "id": "llama-3.1-sonar-large-128k-online", + "name": "llama-3.1-sonar-large-128k-online", + "display_name": "llama-3.1-sonar-large-128k-online", "limit": { "context": 8192, "output": 8192 @@ -81935,15 +93288,15 @@ "supported": false }, "cost": { - "input": 1, - "output": 1 + "input": 1.2, + "output": 1.2 }, "type": "chat" }, { - "id": "gemma-7b-it", - "name": "gemma-7b-it", - "display_name": "gemma-7b-it", + "id": "aihubmix-Mistral-Large-2411", + "name": "aihubmix-Mistral-Large-2411", + "display_name": "aihubmix-Mistral-Large-2411", "limit": { "context": 8192, "output": 8192 @@ -81953,15 +93306,15 @@ "supported": false }, "cost": { - "input": 0.1, - "output": 0.1 + "input": 2, + "output": 6 }, "type": "chat" }, { - "id": "gemma2-9b-it", - "name": "gemma2-9b-it", - "display_name": "gemma2-9b-it", + "id": "aihubmix-Mistral-large-2407", + "name": "aihubmix-Mistral-large-2407", + "display_name": "aihubmix-Mistral-large-2407", "limit": { "context": 8192, "output": 8192 @@ -81971,15 +93324,15 @@ "supported": false }, "cost": { - "input": 0.4, - "output": 0.4 + "input": 3, + "output": 9 }, "type": "chat" }, { - "id": "glm-3-turbo", - "name": "glm-3-turbo", - "display_name": "glm-3-turbo", + "id": "grok-2-1212", + "name": "grok-2-1212", + "display_name": "grok-2-1212", "limit": { "context": 8192, "output": 8192 @@ -81989,15 +93342,15 @@ "supported": false }, "cost": { - "input": 0.71, - "output": 0.71 + "input": 1.8, + "output": 9 }, "type": "chat" }, { - "id": "glm-4", - "name": "glm-4", - "display_name": "glm-4", + "id": "llama-3.1-70b", + "name": "llama-3.1-70b", + "display_name": "llama-3.1-70b", "limit": { "context": 8192, "output": 8192 @@ -82007,15 +93360,15 @@ "supported": false }, "cost": { - "input": 14.2, - "output": 14.2 + "input": 0.44, + "output": 0.44 }, "type": "chat" }, { - "id": "glm-4-flash", - "name": "glm-4-flash", - "display_name": "glm-4-flash", + "id": "gemini-2.0-flash-thinking-exp", + "name": "gemini-2.0-flash-thinking-exp", + "display_name": "gemini-2.0-flash-thinking-exp", "limit": { "context": 8192, "output": 8192 @@ -82025,15 +93378,15 @@ "supported": false }, "cost": { - "input": 0.1, - "output": 0.1 + "input": 0.076, + "output": 0.304 }, "type": "chat" }, { - "id": "glm-4-plus", - "name": "glm-4-plus", - "display_name": "glm-4-plus", + "id": "gpt-image-test", + "name": "gpt-image-test", + "display_name": "gpt-image-test", "limit": { "context": 8192, "output": 8192 @@ -82043,18 +93396,20 @@ "supported": false }, "cost": { - "input": 8, - "output": 8 + "input": 5, + "output": 40, + "cache_read": 0 }, "type": "chat" }, { - "id": "glm-4.5-airx", - "name": "glm-4.5-airx", - "display_name": "glm-4.5-airx", + "id": "imagen-3.0-generate-002", + "name": "imagen-3.0-generate-002", + "display_name": "imagen-3.0-generate-002", "modalities": { "input": [ - "text" + "text", + "image" ] }, "limit": { @@ -82066,16 +93421,16 @@ "supported": false }, "cost": { - "input": 1.1, - "output": 4.51, - "cache_read": 0.22 + "input": 2, + "output": 2, + "cache_read": 0 }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "glm-4v", - "name": "glm-4v", - "display_name": "glm-4v", + "id": "llama3.1-8b", + "name": "llama3.1-8b", + "display_name": "llama3.1-8b", "limit": { "context": 8192, "output": 8192 @@ -82085,15 +93440,21 @@ "supported": false }, "cost": { - "input": 14.2, - "output": 14.2 + "input": 0.3, + "output": 0.6 }, "type": "chat" }, { - "id": "glm-4v-plus", - "name": "glm-4v-plus", - "display_name": "glm-4v-plus", + "id": "DESCRIBE", + "name": "DESCRIBE", + "display_name": "DESCRIBE", + "modalities": { + "input": [ + "text", + "image" + ] + }, "limit": { "context": 8192, "output": 8192 @@ -82104,14 +93465,21 @@ }, "cost": { "input": 2, - "output": 2 + "output": 2, + "cache_read": 0 }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "google-gemma-3-12b-it", - "name": "google-gemma-3-12b-it", - "display_name": "google-gemma-3-12b-it", + "id": "UPSCALE", + "name": "UPSCALE", + "display_name": "UPSCALE", + "modalities": { + "input": [ + "text", + "image" + ] + }, "limit": { "context": 8192, "output": 8192 @@ -82121,15 +93489,16 @@ "supported": false }, "cost": { - "input": 0.2, - "output": 0.2 + "input": 2, + "output": 2, + "cache_read": 0 }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "google-gemma-3-27b-it", - "name": "google-gemma-3-27b-it", - "display_name": "google-gemma-3-27b-it", + "id": "bai-qwen3-vl-235b-a22b-instruct", + "name": "bai-qwen3-vl-235b-a22b-instruct", + "display_name": "bai-qwen3-vl-235b-a22b-instruct", "limit": { "context": 8192, "output": 8192 @@ -82139,35 +93508,38 @@ "supported": false }, "cost": { - "input": 0.2, - "output": 0.2, - "cache_read": 0 + "input": 0.274, + "output": 1.096 }, "type": "chat" }, { - "id": "google-gemma-3-4b-it", - "name": "google-gemma-3-4b-it", - "display_name": "google-gemma-3-4b-it", + "id": "cc-MiniMax-M2", + "name": "cc-MiniMax-M2", + "display_name": "cc-MiniMax-M2", + "modalities": { + "input": [ + "text" + ] + }, "limit": { "context": 8192, "output": 8192 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "cost": { - "input": 0.2, - "output": 0.2, - "cache_read": 0 + "input": 0.1, + "output": 0.1 }, "type": "chat" }, { - "id": "google/gemini-exp-1114", - "name": "google/gemini-exp-1114", - "display_name": "google/gemini-exp-1114", + "id": "cc-deepseek-v3", + "name": "cc-deepseek-v3", + "display_name": "cc-deepseek-v3", "limit": { "context": 8192, "output": 8192 @@ -82177,51 +93549,63 @@ "supported": false }, "cost": { - "input": 1.25, - "output": 5 + "input": 0.3, + "output": 0.3 }, "type": "chat" }, { - "id": "google/gemma-2-27b-it", - "name": "google/gemma-2-27b-it", - "display_name": "google/gemma-2-27b-it", + "id": "cc-deepseek-v3.1", + "name": "cc-deepseek-v3.1", + "display_name": "cc-deepseek-v3.1", + "modalities": { + "input": [ + "text" + ] + }, "limit": { "context": 8192, "output": 8192 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "cost": { - "input": 0.8, - "output": 0.8 + "input": 0.56, + "output": 1.68 }, "type": "chat" }, { - "id": "google/gemma-2-9b-it:free", - "name": "google/gemma-2-9b-it:free", - "display_name": "google/gemma-2-9b-it:free", + "id": "cc-ernie-4.5-300b-a47b", + "name": "cc-ernie-4.5-300b-a47b", + "display_name": "cc-ernie-4.5-300b-a47b", + "modalities": { + "input": [ + "text", + "image" + ] + }, "limit": { "context": 8192, "output": 8192 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "cost": { - "input": 0.02, - "output": 0.02 + "input": 0.32, + "output": 1.28, + "cache_read": 0 }, "type": "chat" }, { - "id": "gpt-3.5-turbo", - "name": "gpt-3.5-turbo", - "display_name": "gpt-3.5-turbo", + "id": "cc-kimi-dev-72b", + "name": "cc-kimi-dev-72b", + "display_name": "cc-kimi-dev-72b", "limit": { "context": 8192, "output": 8192 @@ -82231,51 +93615,62 @@ "supported": false }, "cost": { - "input": 0.5, - "output": 1.5 + "input": 0.32, + "output": 1.28, + "cache_read": 0 }, "type": "chat" }, { - "id": "gpt-3.5-turbo-0301", - "name": "gpt-3.5-turbo-0301", - "display_name": "gpt-3.5-turbo-0301", + "id": "cc-kimi-k2-instruct", + "name": "cc-kimi-k2-instruct", + "display_name": "cc-kimi-k2-instruct", + "modalities": { + "input": [ + "text" + ] + }, "limit": { "context": 8192, "output": 8192 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "cost": { - "input": 1.5, - "output": 1.5 + "input": 1.1, + "output": 3.3 }, "type": "chat" }, { - "id": "gpt-3.5-turbo-0613", - "name": "gpt-3.5-turbo-0613", - "display_name": "gpt-3.5-turbo-0613", + "id": "cc-kimi-k2-instruct-0905", + "name": "cc-kimi-k2-instruct-0905", + "display_name": "cc-kimi-k2-instruct-0905", + "modalities": { + "input": [ + "text" + ] + }, "limit": { "context": 8192, "output": 8192 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "cost": { - "input": 1.5, - "output": 2 + "input": 1.1, + "output": 3.3 }, "type": "chat" }, { - "id": "gpt-3.5-turbo-1106", - "name": "gpt-3.5-turbo-1106", - "display_name": "gpt-3.5-turbo-1106", + "id": "cc-kimi-k2-thinking", + "name": "cc-kimi-k2-thinking", + "display_name": "cc-kimi-k2-thinking", "limit": { "context": 8192, "output": 8192 @@ -82285,15 +93680,15 @@ "supported": false }, "cost": { - "input": 1, - "output": 2 + "input": 0.548, + "output": 2.192 }, "type": "chat" }, { - "id": "gpt-3.5-turbo-16k", - "name": "gpt-3.5-turbo-16k", - "display_name": "gpt-3.5-turbo-16k", + "id": "computer-use-preview", + "name": "computer-use-preview", + "display_name": "computer-use-preview", "limit": { "context": 8192, "output": 8192 @@ -82304,14 +93699,14 @@ }, "cost": { "input": 3, - "output": 4 + "output": 12 }, "type": "chat" }, { - "id": "gpt-3.5-turbo-16k-0613", - "name": "gpt-3.5-turbo-16k-0613", - "display_name": "gpt-3.5-turbo-16k-0613", + "id": "crush-glm-4.6-free", + "name": "crush-glm-4.6-free", + "display_name": "crush-glm-4.6-free", "limit": { "context": 8192, "output": 8192 @@ -82321,33 +93716,41 @@ "supported": false }, "cost": { - "input": 3, - "output": 4 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "gpt-3.5-turbo-instruct", - "name": "gpt-3.5-turbo-instruct", - "display_name": "gpt-3.5-turbo-instruct", + "id": "o1-2024-12-17", + "name": "o1-2024-12-17", + "display_name": "o1-2024-12-17", + "modalities": { + "input": [ + "text", + "image" + ] + }, "limit": { "context": 8192, "output": 8192 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "cost": { - "input": 1.5, - "output": 2 + "input": 15, + "output": 60, + "cache_read": 7.5 }, "type": "chat" }, { - "id": "gpt-4", - "name": "gpt-4", - "display_name": "gpt-4", + "id": "sf-kimi-k2-thinking", + "name": "sf-kimi-k2-thinking", + "display_name": "sf-kimi-k2-thinking", "limit": { "context": 8192, "output": 8192 @@ -82357,15 +93760,15 @@ "supported": false }, "cost": { - "input": 30, - "output": 60 + "input": 0.548, + "output": 2.192 }, "type": "chat" }, { - "id": "gpt-4-0125-preview", - "name": "gpt-4-0125-preview", - "display_name": "gpt-4-0125-preview", + "id": "mistralai/mistral-7b-instruct:free", + "name": "mistralai/mistral-7b-instruct:free", + "display_name": "mistralai/mistral-7b-instruct:free", "limit": { "context": 8192, "output": 8192 @@ -82375,15 +93778,15 @@ "supported": false }, "cost": { - "input": 10, - "output": 30 + "input": 0.002, + "output": 0.002 }, "type": "chat" }, { - "id": "gpt-4-0314", - "name": "gpt-4-0314", - "display_name": "gpt-4-0314", + "id": "mm-minimax-m2.1", + "name": "mm-minimax-m2.1", + "display_name": "mm-minimax-m2.1", "limit": { "context": 8192, "output": 8192 @@ -82393,15 +93796,15 @@ "supported": false }, "cost": { - "input": 30, - "output": 60 + "input": 0.288, + "output": 1.152 }, "type": "chat" }, { - "id": "gpt-4-0613", - "name": "gpt-4-0613", - "display_name": "gpt-4-0613", + "id": "moonshot-kimi-k2.5", + "name": "moonshot-kimi-k2.5", + "display_name": "moonshot-kimi-k2.5", "limit": { "context": 8192, "output": 8192 @@ -82411,15 +93814,16 @@ "supported": false }, "cost": { - "input": 30, - "output": 60 + "input": 0.6, + "output": 3, + "cache_read": 0.105 }, "type": "chat" }, { - "id": "gpt-4-1106-preview", - "name": "gpt-4-1106-preview", - "display_name": "gpt-4-1106-preview", + "id": "moonshot-v1-128k", + "name": "moonshot-v1-128k", + "display_name": "moonshot-v1-128k", "limit": { "context": 8192, "output": 8192 @@ -82430,14 +93834,14 @@ }, "cost": { "input": 10, - "output": 30 + "output": 10 }, "type": "chat" }, { - "id": "gpt-4-32k-0314", - "name": "gpt-4-32k-0314", - "display_name": "gpt-4-32k-0314", + "id": "moonshot-v1-128k-vision-preview", + "name": "moonshot-v1-128k-vision-preview", + "display_name": "moonshot-v1-128k-vision-preview", "limit": { "context": 8192, "output": 8192 @@ -82447,15 +93851,15 @@ "supported": false }, "cost": { - "input": 60, - "output": 120 + "input": 10, + "output": 10 }, "type": "chat" }, { - "id": "gpt-4-32k-0613", - "name": "gpt-4-32k-0613", - "display_name": "gpt-4-32k-0613", + "id": "moonshot-v1-32k", + "name": "moonshot-v1-32k", + "display_name": "moonshot-v1-32k", "limit": { "context": 8192, "output": 8192 @@ -82465,15 +93869,15 @@ "supported": false }, "cost": { - "input": 60, - "output": 120 + "input": 4, + "output": 4 }, "type": "chat" }, { - "id": "gpt-4-turbo", - "name": "gpt-4-turbo", - "display_name": "gpt-4-turbo", + "id": "moonshot-v1-32k-vision-preview", + "name": "moonshot-v1-32k-vision-preview", + "display_name": "moonshot-v1-32k-vision-preview", "limit": { "context": 8192, "output": 8192 @@ -82483,15 +93887,15 @@ "supported": false }, "cost": { - "input": 10, - "output": 30 + "input": 4, + "output": 4 }, "type": "chat" }, { - "id": "gpt-4-turbo-2024-04-09", - "name": "gpt-4-turbo-2024-04-09", - "display_name": "gpt-4-turbo-2024-04-09", + "id": "moonshot-v1-8k", + "name": "moonshot-v1-8k", + "display_name": "moonshot-v1-8k", "limit": { "context": 8192, "output": 8192 @@ -82501,15 +93905,15 @@ "supported": false }, "cost": { - "input": 10, - "output": 30 + "input": 2, + "output": 2 }, "type": "chat" }, { - "id": "gpt-4-turbo-preview", - "name": "gpt-4-turbo-preview", - "display_name": "gpt-4-turbo-preview", + "id": "moonshot-v1-8k-vision-preview", + "name": "moonshot-v1-8k-vision-preview", + "display_name": "moonshot-v1-8k-vision-preview", "limit": { "context": 8192, "output": 8192 @@ -82519,15 +93923,15 @@ "supported": false }, "cost": { - "input": 10, - "output": 30 + "input": 2, + "output": 2 }, "type": "chat" }, { - "id": "gpt-4-vision-preview", - "name": "gpt-4-vision-preview", - "display_name": "gpt-4-vision-preview", + "id": "nvidia/Llama-3_1-Nemotron-Ultra-253B-v1", + "name": "nvidia/Llama-3_1-Nemotron-Ultra-253B-v1", + "display_name": "nvidia/Llama-3_1-Nemotron-Ultra-253B-v1", "limit": { "context": 8192, "output": 8192 @@ -82537,40 +93941,35 @@ "supported": false }, "cost": { - "input": 10, - "output": 30 + "input": 0.5, + "output": 0.5, + "cache_read": 0 }, "type": "chat" }, { - "id": "gpt-4o-2024-05-13", - "name": "gpt-4o-2024-05-13", - "display_name": "gpt-4o-2024-05-13", + "id": "o1-mini-2024-09-12", + "name": "o1-mini-2024-09-12", + "display_name": "o1-mini-2024-09-12", "limit": { - "context": 128000, - "output": 128000 + "context": 8192, + "output": 8192 }, "tool_call": false, "reasoning": { "supported": false }, "cost": { - "input": 5, - "output": 15, - "cache_read": 5 + "input": 3, + "output": 12, + "cache_read": 1.5 }, "type": "chat" }, { - "id": "gpt-4o-mini-2024-07-18", - "name": "gpt-4o-mini-2024-07-18", - "display_name": "gpt-4o-mini-2024-07-18", - "modalities": { - "input": [ - "text", - "image" - ] - }, + "id": "omni-moderation-latest", + "name": "omni-moderation-latest", + "display_name": "omni-moderation-latest", "limit": { "context": 8192, "output": 8192 @@ -82580,46 +93979,15 @@ "supported": false }, "cost": { - "input": 0.15, - "output": 0.6, - "cache_read": 0.075 - }, - "type": "chat" - }, - { - "id": "gpt-oss-20b", - "name": "gpt-oss-20b", - "display_name": "gpt-oss-20b", - "modalities": { - "input": [ - "text" - ] - }, - "limit": { - "context": 128000, - "output": 128000 - }, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "cost": { - "input": 0.11, - "output": 0.55 + "input": 0.02, + "output": 0.02 }, "type": "chat" }, { - "id": "grok-2-vision-1212", - "name": "grok-2-vision-1212", - "display_name": "grok-2-vision-1212", - "modalities": { - "input": [ - "text", - "image" - ] - }, + "id": "qwen-flash", + "name": "qwen-flash", + "display_name": "qwen-flash", "limit": { "context": 8192, "output": 8192 @@ -82629,21 +93997,16 @@ "supported": false }, "cost": { - "input": 1.8, - "output": 9 + "input": 0.02, + "output": 0.2, + "cache_read": 0.02 }, "type": "chat" }, { - "id": "grok-vision-beta", - "name": "grok-vision-beta", - "display_name": "grok-vision-beta", - "modalities": { - "input": [ - "text", - "image" - ] - }, + "id": "qwen-flash-2025-07-28", + "name": "qwen-flash-2025-07-28", + "display_name": "qwen-flash-2025-07-28", "limit": { "context": 8192, "output": 8192 @@ -82653,15 +94016,16 @@ "supported": false }, "cost": { - "input": 5.6, - "output": 16.8 + "input": 0.02, + "output": 0.2, + "cache_read": 0.02 }, "type": "chat" }, { - "id": "groq-llama-3.1-8b-instant", - "name": "groq-llama-3.1-8b-instant", - "display_name": "groq-llama-3.1-8b-instant", + "id": "qwen-long", + "name": "qwen-long", + "display_name": "qwen-long", "limit": { "context": 8192, "output": 8192 @@ -82671,15 +94035,15 @@ "supported": false }, "cost": { - "input": 0.055, - "output": 0.088 + "input": 0.1, + "output": 0.4 }, "type": "chat" }, { - "id": "groq-llama-3.3-70b-versatile", - "name": "groq-llama-3.3-70b-versatile", - "display_name": "groq-llama-3.3-70b-versatile", + "id": "qwen-max", + "name": "qwen-max", + "display_name": "qwen-max", "limit": { "context": 8192, "output": 8192 @@ -82689,15 +94053,15 @@ "supported": false }, "cost": { - "input": 0.649, - "output": 0.869011 + "input": 0.38, + "output": 1.52 }, "type": "chat" }, { - "id": "groq-llama-4-maverick-17b-128e-instruct", - "name": "groq-llama-4-maverick-17b-128e-instruct", - "display_name": "groq-llama-4-maverick-17b-128e-instruct", + "id": "qwen-max-longcontext", + "name": "qwen-max-longcontext", + "display_name": "qwen-max-longcontext", "limit": { "context": 8192, "output": 8192 @@ -82707,15 +94071,15 @@ "supported": false }, "cost": { - "input": 0.22, - "output": 0.66 + "input": 7, + "output": 21 }, "type": "chat" }, { - "id": "groq-llama-4-scout-17b-16e-instruct", - "name": "groq-llama-4-scout-17b-16e-instruct", - "display_name": "groq-llama-4-scout-17b-16e-instruct", + "id": "qwen-plus", + "name": "qwen-plus", + "display_name": "qwen-plus", "limit": { "context": 8192, "output": 8192 @@ -82725,19 +94089,18 @@ "supported": false }, "cost": { - "input": 0.122, - "output": 0.366 + "input": 0.7, + "output": 2.1 }, "type": "chat" }, { - "id": "imagen-4.0-generate-preview-05-20", - "name": "imagen-4.0-generate-preview-05-20", - "display_name": "imagen-4.0-generate-preview-05-20", + "id": "qwen-turbo", + "name": "qwen-turbo", + "display_name": "qwen-turbo", "modalities": { "input": [ - "text", - "image" + "text" ] }, "limit": { @@ -82749,16 +94112,15 @@ "supported": false }, "cost": { - "input": 2, - "output": 2, - "cache_read": 0 + "input": 0.36, + "output": 1.08 }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "jina-embeddings-v2-base-code", - "name": "jina-embeddings-v2-base-code", - "display_name": "jina-embeddings-v2-base-code", + "id": "qwen-turbo-2024-11-01", + "name": "qwen-turbo-2024-11-01", + "display_name": "qwen-turbo-2024-11-01", "modalities": { "input": [ "text" @@ -82773,15 +94135,15 @@ "supported": false }, "cost": { - "input": 0.05, - "output": 0.05 + "input": 0.36, + "output": 1.08 }, - "type": "embedding" + "type": "chat" }, { - "id": "learnlm-1.5-pro-experimental", - "name": "learnlm-1.5-pro-experimental", - "display_name": "learnlm-1.5-pro-experimental", + "id": "qwen2.5-14b-instruct", + "name": "qwen2.5-14b-instruct", + "display_name": "qwen2.5-14b-instruct", "limit": { "context": 8192, "output": 8192 @@ -82791,15 +94153,15 @@ "supported": false }, "cost": { - "input": 1.25, - "output": 5 + "input": 0.4, + "output": 1.2 }, "type": "chat" }, { - "id": "llama-3.1-405b-instruct", - "name": "llama-3.1-405b-instruct", - "display_name": "llama-3.1-405b-instruct", + "id": "qwen2.5-32b-instruct", + "name": "qwen2.5-32b-instruct", + "display_name": "qwen2.5-32b-instruct", "limit": { "context": 8192, "output": 8192 @@ -82809,15 +94171,15 @@ "supported": false }, "cost": { - "input": 4, - "output": 4 + "input": 0.6, + "output": 1.2 }, "type": "chat" }, { - "id": "llama-3.1-405b-reasoning", - "name": "llama-3.1-405b-reasoning", - "display_name": "llama-3.1-405b-reasoning", + "id": "qwen2.5-3b-instruct", + "name": "qwen2.5-3b-instruct", + "display_name": "qwen2.5-3b-instruct", "limit": { "context": 8192, "output": 8192 @@ -82827,15 +94189,15 @@ "supported": false }, "cost": { - "input": 4, - "output": 4 + "input": 0.4, + "output": 0.8 }, "type": "chat" }, { - "id": "llama-3.1-70b-versatile", - "name": "llama-3.1-70b-versatile", - "display_name": "llama-3.1-70b-versatile", + "id": "qwen2.5-72b-instruct", + "name": "qwen2.5-72b-instruct", + "display_name": "qwen2.5-72b-instruct", "limit": { "context": 8192, "output": 8192 @@ -82845,15 +94207,15 @@ "supported": false }, "cost": { - "input": 0.6, - "output": 0.6 + "input": 0.8, + "output": 2.4 }, "type": "chat" }, { - "id": "llama-3.1-8b-instant", - "name": "llama-3.1-8b-instant", - "display_name": "llama-3.1-8b-instant", + "id": "qwen2.5-7b-instruct", + "name": "qwen2.5-7b-instruct", + "display_name": "qwen2.5-7b-instruct", "limit": { "context": 8192, "output": 8192 @@ -82863,15 +94225,15 @@ "supported": false }, "cost": { - "input": 0.3, - "output": 0.6 + "input": 0.4, + "output": 0.8 }, "type": "chat" }, { - "id": "llama-3.1-sonar-small-128k-online", - "name": "llama-3.1-sonar-small-128k-online", - "display_name": "llama-3.1-sonar-small-128k-online", + "id": "qwen2.5-coder-1.5b-instruct", + "name": "qwen2.5-coder-1.5b-instruct", + "display_name": "qwen2.5-coder-1.5b-instruct", "limit": { "context": 8192, "output": 8192 @@ -82881,15 +94243,15 @@ "supported": false }, "cost": { - "input": 0.3, - "output": 0.3 + "input": 0.2, + "output": 0.4 }, "type": "chat" }, { - "id": "llama-3.2-11b-vision-preview", - "name": "llama-3.2-11b-vision-preview", - "display_name": "llama-3.2-11b-vision-preview", + "id": "qwen2.5-coder-7b-instruct", + "name": "qwen2.5-coder-7b-instruct", + "display_name": "qwen2.5-coder-7b-instruct", "limit": { "context": 8192, "output": 8192 @@ -82900,14 +94262,14 @@ }, "cost": { "input": 0.2, - "output": 0.2 + "output": 0.4 }, "type": "chat" }, { - "id": "llama-3.2-1b-preview", - "name": "llama-3.2-1b-preview", - "display_name": "llama-3.2-1b-preview", + "id": "qwen2.5-math-1.5b-instruct", + "name": "qwen2.5-math-1.5b-instruct", + "display_name": "qwen2.5-math-1.5b-instruct", "limit": { "context": 8192, "output": 8192 @@ -82923,9 +94285,9 @@ "type": "chat" }, { - "id": "llama-3.2-3b-preview", - "name": "llama-3.2-3b-preview", - "display_name": "llama-3.2-3b-preview", + "id": "qwen2.5-math-72b-instruct", + "name": "qwen2.5-math-72b-instruct", + "display_name": "qwen2.5-math-72b-instruct", "limit": { "context": 8192, "output": 8192 @@ -82935,15 +94297,15 @@ "supported": false }, "cost": { - "input": 0.2, - "output": 0.2 + "input": 0.8, + "output": 2.4 }, "type": "chat" }, { - "id": "llama-3.2-90b-vision-preview", - "name": "llama-3.2-90b-vision-preview", - "display_name": "llama-3.2-90b-vision-preview", + "id": "qwen2.5-math-7b-instruct", + "name": "qwen2.5-math-7b-instruct", + "display_name": "qwen2.5-math-7b-instruct", "limit": { "context": 8192, "output": 8192 @@ -82953,15 +94315,15 @@ "supported": false }, "cost": { - "input": 2.4, - "output": 2.4 + "input": 0.2, + "output": 0.4 }, "type": "chat" }, { - "id": "llama2-70b-4096", - "name": "llama2-70b-4096", - "display_name": "llama2-70b-4096", + "id": "sonar-reasoning-pro", + "name": "sonar-reasoning-pro", + "display_name": "sonar-reasoning-pro", "limit": { "context": 8192, "output": 8192 @@ -82971,15 +94333,15 @@ "supported": false }, "cost": { - "input": 0.5, - "output": 0.5 + "input": 3, + "output": 12 }, "type": "chat" }, { - "id": "llama2-70b-40960", - "name": "llama2-70b-40960", - "display_name": "llama2-70b-40960", + "id": "sophnet-glm-4.7", + "name": "sophnet-glm-4.7", + "display_name": "sophnet-glm-4.7", "limit": { "context": 8192, "output": 8192 @@ -82989,33 +94351,34 @@ "supported": false }, "cost": { - "input": 0.5, - "output": 0.5 + "input": 0.273974, + "output": 1.095896, + "cache_read": 0.273974 }, "type": "chat" }, { - "id": "llama2-7b-2048", - "name": "llama2-7b-2048", - "display_name": "llama2-7b-2048", + "id": "sophnet-kimi-k2.5", + "name": "sophnet-kimi-k2.5", + "display_name": "sophnet-kimi-k2.5", "limit": { - "context": 8192, - "output": 8192 + "context": 256000, + "output": 256000 }, "tool_call": false, "reasoning": { "supported": false }, "cost": { - "input": 0.1, - "output": 0.1 + "input": 0.548, + "output": 2.877 }, "type": "chat" }, { - "id": "llama3-70b-8192", - "name": "llama3-70b-8192", - "display_name": "llama3-70b-8192", + "id": "sophnet-minimax-m2.1", + "name": "sophnet-minimax-m2.1", + "display_name": "sophnet-minimax-m2.1", "limit": { "context": 8192, "output": 8192 @@ -83025,15 +94388,15 @@ "supported": false }, "cost": { - "input": 0.7, - "output": 0.937288 + "input": 0.2876, + "output": 1.1504 }, "type": "chat" }, { - "id": "llama3-8b-8192", - "name": "llama3-8b-8192", - "display_name": "llama3-8b-8192", + "id": "step-2-16k", + "name": "step-2-16k", + "display_name": "step-2-16k", "limit": { "context": 8192, "output": 8192 @@ -83043,15 +94406,15 @@ "supported": false }, "cost": { - "input": 0.06, - "output": 0.12 + "input": 2, + "output": 2 }, "type": "chat" }, { - "id": "llama3-groq-70b-8192-tool-use-preview", - "name": "llama3-groq-70b-8192-tool-use-preview", - "display_name": "llama3-groq-70b-8192-tool-use-preview", + "id": "text-ada-001", + "name": "text-ada-001", + "display_name": "text-ada-001", "limit": { "context": 8192, "output": 8192 @@ -83061,15 +94424,15 @@ "supported": false }, "cost": { - "input": 0.00089, - "output": 0.00089 + "input": 0.4, + "output": 0.4 }, "type": "chat" }, { - "id": "llama3-groq-8b-8192-tool-use-preview", - "name": "llama3-groq-8b-8192-tool-use-preview", - "display_name": "llama3-groq-8b-8192-tool-use-preview", + "id": "text-babbage-001", + "name": "text-babbage-001", + "display_name": "text-babbage-001", "limit": { "context": 8192, "output": 8192 @@ -83079,15 +94442,15 @@ "supported": false }, "cost": { - "input": 0.00019, - "output": 0.00019 + "input": 0.5, + "output": 0.5 }, "type": "chat" }, { - "id": "meta-llama/Llama-3.2-90B-Vision-Instruct", - "name": "meta-llama/Llama-3.2-90B-Vision-Instruct", - "display_name": "meta-llama/Llama-3.2-90B-Vision-Instruct", + "id": "text-curie-001", + "name": "text-curie-001", + "display_name": "text-curie-001", "limit": { "context": 8192, "output": 8192 @@ -83097,15 +94460,15 @@ "supported": false }, "cost": { - "input": 0.5, - "output": 0.5 + "input": 2, + "output": 2 }, "type": "chat" }, { - "id": "meta-llama/llama-3.1-405b-instruct:free", - "name": "meta-llama/llama-3.1-405b-instruct:free", - "display_name": "meta-llama/llama-3.1-405b-instruct:free", + "id": "text-davinci-002", + "name": "text-davinci-002", + "display_name": "text-davinci-002", "limit": { "context": 8192, "output": 8192 @@ -83115,15 +94478,15 @@ "supported": false }, "cost": { - "input": 0.02, - "output": 0.02 + "input": 20, + "output": 20 }, "type": "chat" }, { - "id": "meta-llama/llama-3.1-70b-instruct:free", - "name": "meta-llama/llama-3.1-70b-instruct:free", - "display_name": "meta-llama/llama-3.1-70b-instruct:free", + "id": "text-davinci-003", + "name": "text-davinci-003", + "display_name": "text-davinci-003", "limit": { "context": 8192, "output": 8192 @@ -83133,15 +94496,15 @@ "supported": false }, "cost": { - "input": 0.02, - "output": 0.02 + "input": 20, + "output": 20 }, "type": "chat" }, { - "id": "meta-llama/llama-3.1-8b-instruct:free", - "name": "meta-llama/llama-3.1-8b-instruct:free", - "display_name": "meta-llama/llama-3.1-8b-instruct:free", + "id": "text-davinci-edit-001", + "name": "text-davinci-edit-001", + "display_name": "text-davinci-edit-001", "limit": { "context": 8192, "output": 8192 @@ -83151,15 +94514,20 @@ "supported": false }, "cost": { - "input": 0.02, - "output": 0.02 + "input": 20, + "output": 20 }, "type": "chat" }, { - "id": "meta-llama/llama-3.2-11b-vision-instruct:free", - "name": "meta-llama/llama-3.2-11b-vision-instruct:free", - "display_name": "meta-llama/llama-3.2-11b-vision-instruct:free", + "id": "text-embedding-3-large", + "name": "text-embedding-3-large", + "display_name": "text-embedding-3-large", + "modalities": { + "input": [ + "text" + ] + }, "limit": { "context": 8192, "output": 8192 @@ -83169,15 +94537,20 @@ "supported": false }, "cost": { - "input": 0.02, - "output": 0.02 + "input": 0.13, + "output": 0.13 }, - "type": "chat" + "type": "embedding" }, { - "id": "meta-llama/llama-3.2-3b-instruct:free", - "name": "meta-llama/llama-3.2-3b-instruct:free", - "display_name": "meta-llama/llama-3.2-3b-instruct:free", + "id": "text-embedding-3-small", + "name": "text-embedding-3-small", + "display_name": "text-embedding-3-small", + "modalities": { + "input": [ + "text" + ] + }, "limit": { "context": 8192, "output": 8192 @@ -83190,12 +94563,17 @@ "input": 0.02, "output": 0.02 }, - "type": "chat" + "type": "embedding" }, { - "id": "meta/llama-3.1-405b-instruct", - "name": "meta/llama-3.1-405b-instruct", - "display_name": "meta/llama-3.1-405b-instruct", + "id": "text-embedding-ada-002", + "name": "text-embedding-ada-002", + "display_name": "text-embedding-ada-002", + "modalities": { + "input": [ + "text" + ] + }, "limit": { "context": 8192, "output": 8192 @@ -83205,15 +94583,20 @@ "supported": false }, "cost": { - "input": 5, - "output": 5 + "input": 0.1, + "output": 0.1 }, - "type": "chat" + "type": "embedding" }, { - "id": "meta/llama3-8B-chat", - "name": "meta/llama3-8B-chat", - "display_name": "meta/llama3-8B-chat", + "id": "text-embedding-v1", + "name": "text-embedding-v1", + "display_name": "text-embedding-v1", + "modalities": { + "input": [ + "text" + ] + }, "limit": { "context": 8192, "output": 8192 @@ -83223,15 +94606,15 @@ "supported": false }, "cost": { - "input": 0.3, - "output": 0.3 + "input": 0.1, + "output": 0.1 }, - "type": "chat" + "type": "embedding" }, { - "id": "mistralai/mistral-7b-instruct:free", - "name": "mistralai/mistral-7b-instruct:free", - "display_name": "mistralai/mistral-7b-instruct:free", + "id": "text-moderation-007", + "name": "text-moderation-007", + "display_name": "text-moderation-007", "limit": { "context": 8192, "output": 8192 @@ -83241,15 +94624,15 @@ "supported": false }, "cost": { - "input": 0.002, - "output": 0.002 + "input": 0.2, + "output": 0.2 }, "type": "chat" }, { - "id": "mm-minimax-m2.1", - "name": "mm-minimax-m2.1", - "display_name": "mm-minimax-m2.1", + "id": "text-moderation-latest", + "name": "text-moderation-latest", + "display_name": "text-moderation-latest", "limit": { "context": 8192, "output": 8192 @@ -83259,15 +94642,15 @@ "supported": false }, "cost": { - "input": 0.288, - "output": 1.152 + "input": 0.2, + "output": 0.2 }, "type": "chat" }, { - "id": "moonshot-v1-128k", - "name": "moonshot-v1-128k", - "display_name": "moonshot-v1-128k", + "id": "text-moderation-stable", + "name": "text-moderation-stable", + "display_name": "text-moderation-stable", "limit": { "context": 8192, "output": 8192 @@ -83277,15 +94660,15 @@ "supported": false }, "cost": { - "input": 10, - "output": 10 + "input": 0.2, + "output": 0.2 }, "type": "chat" }, { - "id": "moonshot-v1-128k-vision-preview", - "name": "moonshot-v1-128k-vision-preview", - "display_name": "moonshot-v1-128k-vision-preview", + "id": "text-search-ada-doc-001", + "name": "text-search-ada-doc-001", + "display_name": "text-search-ada-doc-001", "limit": { "context": 8192, "output": 8192 @@ -83295,15 +94678,20 @@ "supported": false }, "cost": { - "input": 10, - "output": 10 + "input": 20, + "output": 20 }, "type": "chat" }, { - "id": "moonshot-v1-32k", - "name": "moonshot-v1-32k", - "display_name": "moonshot-v1-32k", + "id": "tts-1", + "name": "tts-1", + "display_name": "tts-1", + "modalities": { + "input": [ + "audio" + ] + }, "limit": { "context": 8192, "output": 8192 @@ -83313,15 +94701,41 @@ "supported": false }, "cost": { - "input": 4, - "output": 4 + "input": 15, + "output": 15 + } + }, + { + "id": "tts-1-1106", + "name": "tts-1-1106", + "display_name": "tts-1-1106", + "modalities": { + "input": [ + "audio" + ] }, - "type": "chat" + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "cost": { + "input": 15, + "output": 15 + } }, { - "id": "moonshot-v1-32k-vision-preview", - "name": "moonshot-v1-32k-vision-preview", - "display_name": "moonshot-v1-32k-vision-preview", + "id": "tts-1-hd", + "name": "tts-1-hd", + "display_name": "tts-1-hd", + "modalities": { + "input": [ + "audio" + ] + }, "limit": { "context": 8192, "output": 8192 @@ -83331,15 +94745,44 @@ "supported": false }, "cost": { - "input": 4, - "output": 4 + "input": 30, + "output": 30 + } + }, + { + "id": "tts-1-hd-1106", + "name": "tts-1-hd-1106", + "display_name": "tts-1-hd-1106", + "modalities": { + "input": [ + "audio" + ] }, - "type": "chat" + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "cost": { + "input": 30, + "output": 30 + } }, { - "id": "moonshot-v1-8k", - "name": "moonshot-v1-8k", - "display_name": "moonshot-v1-8k", + "id": "veo-3", + "name": "veo-3", + "display_name": "veo-3", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video" + ] + }, "limit": { "context": 8192, "output": 8192 @@ -83350,14 +94793,23 @@ }, "cost": { "input": 2, - "output": 2 + "output": 2, + "cache_read": 0 }, "type": "chat" }, { - "id": "moonshot-v1-8k-vision-preview", - "name": "moonshot-v1-8k-vision-preview", - "display_name": "moonshot-v1-8k-vision-preview", + "id": "veo3", + "name": "veo3", + "display_name": "veo3", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video" + ] + }, "limit": { "context": 8192, "output": 8192 @@ -83368,14 +94820,20 @@ }, "cost": { "input": 2, - "output": 2 + "output": 2, + "cache_read": 0 }, "type": "chat" }, { - "id": "nvidia/Llama-3_1-Nemotron-Ultra-253B-v1", - "name": "nvidia/Llama-3_1-Nemotron-Ultra-253B-v1", - "display_name": "nvidia/Llama-3_1-Nemotron-Ultra-253B-v1", + "id": "whisper-1", + "name": "whisper-1", + "display_name": "whisper-1", + "modalities": { + "input": [ + "audio" + ] + }, "limit": { "context": 8192, "output": 8192 @@ -83385,16 +94843,20 @@ "supported": false }, "cost": { - "input": 0.5, - "output": 0.5, - "cache_read": 0 + "input": 100, + "output": 100 }, "type": "chat" }, { - "id": "Baichuan3-Turbo", - "name": "Baichuan3-Turbo", - "display_name": "Baichuan3-Turbo", + "id": "whisper-large-v3", + "name": "whisper-large-v3", + "display_name": "whisper-large-v3", + "modalities": { + "input": [ + "audio" + ] + }, "limit": { "context": 8192, "output": 8192 @@ -83404,15 +94866,20 @@ "supported": false }, "cost": { - "input": 1.9, - "output": 1.9 + "input": 30.834, + "output": 30.834 }, "type": "chat" }, { - "id": "Baichuan3-Turbo-128k", - "name": "Baichuan3-Turbo-128k", - "display_name": "Baichuan3-Turbo-128k", + "id": "whisper-large-v3-turbo", + "name": "whisper-large-v3-turbo", + "display_name": "whisper-large-v3-turbo", + "modalities": { + "input": [ + "audio" + ] + }, "limit": { "context": 8192, "output": 8192 @@ -83422,15 +94889,15 @@ "supported": false }, "cost": { - "input": 3.8, - "output": 3.8 + "input": 5.556, + "output": 5.556 }, "type": "chat" }, { - "id": "Baichuan4", - "name": "Baichuan4", - "display_name": "Baichuan4", + "id": "yi-large", + "name": "yi-large", + "display_name": "yi-large", "limit": { "context": 8192, "output": 8192 @@ -83440,15 +94907,15 @@ "supported": false }, "cost": { - "input": 16, - "output": 16 + "input": 3, + "output": 3 }, "type": "chat" }, { - "id": "Baichuan4-Air", - "name": "Baichuan4-Air", - "display_name": "Baichuan4-Air", + "id": "yi-large-rag", + "name": "yi-large-rag", + "display_name": "yi-large-rag", "limit": { "context": 8192, "output": 8192 @@ -83458,15 +94925,15 @@ "supported": false }, "cost": { - "input": 0.16, - "output": 0.16 + "input": 4, + "output": 4 }, "type": "chat" }, { - "id": "Baichuan4-Turbo", - "name": "Baichuan4-Turbo", - "display_name": "Baichuan4-Turbo", + "id": "yi-large-turbo", + "name": "yi-large-turbo", + "display_name": "yi-large-turbo", "limit": { "context": 8192, "output": 8192 @@ -83476,15 +94943,15 @@ "supported": false }, "cost": { - "input": 2.4, - "output": 2.4 + "input": 1.8, + "output": 1.8 }, "type": "chat" }, { - "id": "DeepSeek-v3", - "name": "DeepSeek-v3", - "display_name": "DeepSeek-v3", + "id": "yi-lightning", + "name": "yi-lightning", + "display_name": "yi-lightning", "limit": { "context": 8192, "output": 8192 @@ -83494,15 +94961,15 @@ "supported": false }, "cost": { - "input": 0.272, - "output": 1.088 + "input": 0.2, + "output": 0.2 }, "type": "chat" }, { - "id": "Doubao-1.5-lite-32k", - "name": "Doubao-1.5-lite-32k", - "display_name": "Doubao-1.5-lite-32k", + "id": "yi-medium", + "name": "yi-medium", + "display_name": "yi-medium", "limit": { "context": 8192, "output": 8192 @@ -83512,16 +94979,15 @@ "supported": false }, "cost": { - "input": 0.05, - "output": 0.1, - "cache_read": 0.01 + "input": 0.4, + "output": 0.4 }, "type": "chat" }, { - "id": "Doubao-1.5-pro-256k", - "name": "Doubao-1.5-pro-256k", - "display_name": "Doubao-1.5-pro-256k", + "id": "yi-vl-plus", + "name": "yi-vl-plus", + "display_name": "yi-vl-plus", "limit": { "context": 8192, "output": 8192 @@ -83531,16 +94997,15 @@ "supported": false }, "cost": { - "input": 0.8, - "output": 1.44, - "cache_read": 0.8 + "input": 0.000852, + "output": 0.000852 }, "type": "chat" }, { - "id": "Doubao-1.5-pro-32k", - "name": "Doubao-1.5-pro-32k", - "display_name": "Doubao-1.5-pro-32k", + "id": "fx-flux-2-pro", + "name": "fx-flux-2-pro", + "display_name": "fx-flux-2-pro", "limit": { "context": 8192, "output": 8192 @@ -83550,16 +95015,16 @@ "supported": false }, "cost": { - "input": 0.134, - "output": 0.335, - "cache_read": 0.0268 + "input": 2, + "output": 0, + "cache_read": 0 }, "type": "chat" }, { - "id": "Doubao-1.5-vision-pro-32k", - "name": "Doubao-1.5-vision-pro-32k", - "display_name": "Doubao-1.5-vision-pro-32k", + "id": "gemini-2.0-flash-001", + "name": "gemini-2.0-flash-001", + "display_name": "gemini-2.0-flash-001", "limit": { "context": 8192, "output": 8192 @@ -83569,15 +95034,16 @@ "supported": false }, "cost": { - "input": 0.46, - "output": 1.38 + "input": 0.1, + "output": 0.4, + "cache_read": 0.25 }, "type": "chat" }, { - "id": "Doubao-lite-128k", - "name": "Doubao-lite-128k", - "display_name": "Doubao-lite-128k", + "id": "gemini-2.0-flash-exp-image-generation", + "name": "gemini-2.0-flash-exp-image-generation", + "display_name": "gemini-2.0-flash-exp-image-generation", "limit": { "context": 8192, "output": 8192 @@ -83587,16 +95053,23 @@ "supported": false }, "cost": { - "input": 0.14, - "output": 0.28, - "cache_read": 0.14 + "input": 0.1, + "output": 0.4 }, "type": "chat" }, { - "id": "Doubao-lite-32k", - "name": "Doubao-lite-32k", - "display_name": "Doubao-lite-32k", + "id": "gemini-2.0-flash-lite", + "name": "gemini-2.0-flash-lite", + "display_name": "gemini-2.0-flash-lite", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video" + ] + }, "limit": { "context": 8192, "output": 8192 @@ -83606,16 +95079,16 @@ "supported": false }, "cost": { - "input": 0.06, - "output": 0.12, - "cache_read": 0.012 + "input": 0.076, + "output": 0.304, + "cache_read": 0.076 }, "type": "chat" }, { - "id": "Doubao-lite-4k", - "name": "Doubao-lite-4k", - "display_name": "Doubao-lite-4k", + "id": "gemini-2.0-flash-lite-001", + "name": "gemini-2.0-flash-lite-001", + "display_name": "gemini-2.0-flash-lite-001", "limit": { "context": 8192, "output": 8192 @@ -83625,34 +95098,48 @@ "supported": false }, "cost": { - "input": 0.06, - "output": 0.12, - "cache_read": 0.06 + "input": 0.076, + "output": 0.304, + "cache_read": 0.076 }, "type": "chat" }, { - "id": "Doubao-pro-128k", - "name": "Doubao-pro-128k", - "display_name": "Doubao-pro-128k", + "id": "gemini-2.5-pro-exp-03-25", + "name": "gemini-2.5-pro-exp-03-25", + "display_name": "gemini-2.5-pro-exp-03-25", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video" + ] + }, "limit": { "context": 8192, "output": 8192 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "cost": { - "input": 0.8, - "output": 1.44 + "input": 1.25, + "output": 5, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "Doubao-pro-256k", - "name": "Doubao-pro-256k", - "display_name": "Doubao-pro-256k", + "id": "gemini-embedding-exp-03-07", + "name": "gemini-embedding-exp-03-07", + "display_name": "gemini-embedding-exp-03-07", + "modalities": { + "input": [ + "text" + ] + }, "limit": { "context": 8192, "output": 8192 @@ -83662,16 +95149,15 @@ "supported": false }, "cost": { - "input": 0.8, - "output": 1.44, - "cache_read": 0.8 + "input": 0.02, + "output": 0.02 }, - "type": "chat" + "type": "embedding" }, { - "id": "Doubao-pro-32k", - "name": "Doubao-pro-32k", - "display_name": "Doubao-pro-32k", + "id": "gemini-exp-1114", + "name": "gemini-exp-1114", + "display_name": "gemini-exp-1114", "limit": { "context": 8192, "output": 8192 @@ -83681,16 +95167,15 @@ "supported": false }, "cost": { - "input": 0.14, - "output": 0.35, - "cache_read": 0.028 + "input": 1.25, + "output": 5 }, "type": "chat" }, { - "id": "Doubao-pro-4k", - "name": "Doubao-pro-4k", - "display_name": "Doubao-pro-4k", + "id": "gemini-exp-1121", + "name": "gemini-exp-1121", + "display_name": "gemini-exp-1121", "limit": { "context": 8192, "output": 8192 @@ -83700,15 +95185,15 @@ "supported": false }, "cost": { - "input": 0.14, - "output": 0.35 + "input": 1.25, + "output": 5 }, "type": "chat" }, { - "id": "GPT-OSS-20B", - "name": "GPT-OSS-20B", - "display_name": "GPT-OSS-20B", + "id": "gemini-pro", + "name": "gemini-pro", + "display_name": "gemini-pro", "limit": { "context": 8192, "output": 8192 @@ -83718,15 +95203,15 @@ "supported": false }, "cost": { - "input": 0.11, - "output": 0.55 + "input": 0.2, + "output": 0.6 }, "type": "chat" }, { - "id": "Gryphe/MythoMax-L2-13b", - "name": "Gryphe/MythoMax-L2-13b", - "display_name": "Gryphe/MythoMax-L2-13b", + "id": "gemini-pro-vision", + "name": "gemini-pro-vision", + "display_name": "gemini-pro-vision", "limit": { "context": 8192, "output": 8192 @@ -83736,20 +95221,15 @@ "supported": false }, "cost": { - "input": 0.4, - "output": 0.4 + "input": 1, + "output": 1 }, "type": "chat" }, { - "id": "MiniMax-Text-01", - "name": "MiniMax-Text-01", - "display_name": "MiniMax-Text-01", - "modalities": { - "input": [ - "text" - ] - }, + "id": "gemma-7b-it", + "name": "gemma-7b-it", + "display_name": "gemma-7b-it", "limit": { "context": 8192, "output": 8192 @@ -83759,15 +95239,15 @@ "supported": false }, "cost": { - "input": 0.14, - "output": 1.12 + "input": 0.1, + "output": 0.1 }, "type": "chat" }, { - "id": "Mistral-large-2407", - "name": "Mistral-large-2407", - "display_name": "Mistral-large-2407", + "id": "gemma2-9b-it", + "name": "gemma2-9b-it", + "display_name": "gemma2-9b-it", "limit": { "context": 8192, "output": 8192 @@ -83777,15 +95257,15 @@ "supported": false }, "cost": { - "input": 3, - "output": 9 + "input": 0.4, + "output": 0.4 }, "type": "chat" }, { - "id": "Qwen/Qwen2-1.5B-Instruct", - "name": "Qwen/Qwen2-1.5B-Instruct", - "display_name": "Qwen/Qwen2-1.5B-Instruct", + "id": "glm-3-turbo", + "name": "glm-3-turbo", + "display_name": "glm-3-turbo", "limit": { "context": 8192, "output": 8192 @@ -83795,15 +95275,15 @@ "supported": false }, "cost": { - "input": 0.2, - "output": 0.2 + "input": 0.71, + "output": 0.71 }, "type": "chat" }, { - "id": "Qwen/Qwen2-57B-A14B-Instruct", - "name": "Qwen/Qwen2-57B-A14B-Instruct", - "display_name": "Qwen/Qwen2-57B-A14B-Instruct", + "id": "glm-4", + "name": "glm-4", + "display_name": "glm-4", "limit": { "context": 8192, "output": 8192 @@ -83813,15 +95293,15 @@ "supported": false }, "cost": { - "input": 0.24, - "output": 0.24 + "input": 14.2, + "output": 14.2 }, "type": "chat" }, { - "id": "Qwen/Qwen2-72B-Instruct", - "name": "Qwen/Qwen2-72B-Instruct", - "display_name": "Qwen/Qwen2-72B-Instruct", + "id": "glm-4-flash", + "name": "glm-4-flash", + "display_name": "glm-4-flash", "limit": { "context": 8192, "output": 8192 @@ -83831,15 +95311,15 @@ "supported": false }, "cost": { - "input": 0.8, - "output": 0.8 + "input": 0.1, + "output": 0.1 }, "type": "chat" }, { - "id": "Qwen/Qwen2-7B-Instruct", - "name": "Qwen/Qwen2-7B-Instruct", - "display_name": "Qwen/Qwen2-7B-Instruct", + "id": "glm-4-plus", + "name": "glm-4-plus", + "display_name": "glm-4-plus", "limit": { "context": 8192, "output": 8192 @@ -83849,15 +95329,20 @@ "supported": false }, "cost": { - "input": 0.08, - "output": 0.08 + "input": 8, + "output": 8 }, "type": "chat" }, { - "id": "Qwen/Qwen2.5-32B-Instruct", - "name": "Qwen/Qwen2.5-32B-Instruct", - "display_name": "Qwen/Qwen2.5-32B-Instruct", + "id": "glm-4.5-airx", + "name": "glm-4.5-airx", + "display_name": "glm-4.5-airx", + "modalities": { + "input": [ + "text" + ] + }, "limit": { "context": 8192, "output": 8192 @@ -83867,15 +95352,16 @@ "supported": false }, "cost": { - "input": 0.6, - "output": 0.6 + "input": 1.1, + "output": 4.51, + "cache_read": 0.22 }, "type": "chat" }, { - "id": "Qwen/Qwen2.5-72B-Instruct", - "name": "Qwen/Qwen2.5-72B-Instruct", - "display_name": "Qwen/Qwen2.5-72B-Instruct", + "id": "glm-4v", + "name": "glm-4v", + "display_name": "glm-4v", "limit": { "context": 8192, "output": 8192 @@ -83885,15 +95371,15 @@ "supported": false }, "cost": { - "input": 0.8, - "output": 0.8 + "input": 14.2, + "output": 14.2 }, "type": "chat" }, { - "id": "Qwen/Qwen2.5-72B-Instruct-128K", - "name": "Qwen/Qwen2.5-72B-Instruct-128K", - "display_name": "Qwen/Qwen2.5-72B-Instruct-128K", + "id": "glm-4v-plus", + "name": "glm-4v-plus", + "display_name": "glm-4v-plus", "limit": { "context": 8192, "output": 8192 @@ -83903,15 +95389,15 @@ "supported": false }, "cost": { - "input": 0.8, - "output": 0.8 + "input": 2, + "output": 2 }, "type": "chat" }, { - "id": "Qwen/Qwen2.5-7B-Instruct", - "name": "Qwen/Qwen2.5-7B-Instruct", - "display_name": "Qwen/Qwen2.5-7B-Instruct", + "id": "google-gemma-3-12b-it", + "name": "google-gemma-3-12b-it", + "display_name": "google-gemma-3-12b-it", "limit": { "context": 8192, "output": 8192 @@ -83921,15 +95407,15 @@ "supported": false }, "cost": { - "input": 0.4, - "output": 0.4 + "input": 0.2, + "output": 0.2 }, "type": "chat" }, { - "id": "Qwen/Qwen2.5-Coder-32B-Instruct", - "name": "Qwen/Qwen2.5-Coder-32B-Instruct", - "display_name": "Qwen/Qwen2.5-Coder-32B-Instruct", + "id": "google-gemma-3-27b-it", + "name": "google-gemma-3-27b-it", + "display_name": "google-gemma-3-27b-it", "limit": { "context": 8192, "output": 8192 @@ -83939,15 +95425,16 @@ "supported": false }, "cost": { - "input": 0.16, - "output": 0.16 + "input": 0.2, + "output": 0.2, + "cache_read": 0 }, "type": "chat" }, { - "id": "Qwen3-235B-A22B-Thinking-2507", - "name": "Qwen3-235B-A22B-Thinking-2507", - "display_name": "Qwen3-235B-A22B-Thinking-2507", + "id": "google-gemma-3-4b-it", + "name": "google-gemma-3-4b-it", + "display_name": "google-gemma-3-4b-it", "limit": { "context": 8192, "output": 8192 @@ -83957,21 +95444,16 @@ "supported": false }, "cost": { - "input": 0.28, - "output": 2.8 + "input": 0.2, + "output": 0.2, + "cache_read": 0 }, "type": "chat" }, { - "id": "Stable-Diffusion-3-5-Large", - "name": "Stable-Diffusion-3-5-Large", - "display_name": "Stable-Diffusion-3-5-Large", - "modalities": { - "input": [ - "text", - "image" - ] - }, + "id": "google/gemini-exp-1114", + "name": "google/gemini-exp-1114", + "display_name": "google/gemini-exp-1114", "limit": { "context": 8192, "output": 8192 @@ -83981,16 +95463,15 @@ "supported": false }, "cost": { - "input": 4, - "output": 4, - "cache_read": 0 + "input": 1.25, + "output": 5 }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "WizardLM/WizardCoder-Python-34B-V1.0", - "name": "WizardLM/WizardCoder-Python-34B-V1.0", - "display_name": "WizardLM/WizardCoder-Python-34B-V1.0", + "id": "google/gemma-2-27b-it", + "name": "google/gemma-2-27b-it", + "display_name": "google/gemma-2-27b-it", "limit": { "context": 8192, "output": 8192 @@ -84000,15 +95481,15 @@ "supported": false }, "cost": { - "input": 0.9, - "output": 0.9 + "input": 0.8, + "output": 0.8 }, "type": "chat" }, { - "id": "ahm-Phi-3-5-MoE-instruct", - "name": "ahm-Phi-3-5-MoE-instruct", - "display_name": "ahm-Phi-3-5-MoE-instruct", + "id": "google/gemma-2-9b-it:free", + "name": "google/gemma-2-9b-it:free", + "display_name": "google/gemma-2-9b-it:free", "limit": { "context": 8192, "output": 8192 @@ -84018,15 +95499,15 @@ "supported": false }, "cost": { - "input": 0.4, - "output": 1.6 + "input": 0.02, + "output": 0.02 }, "type": "chat" }, { - "id": "ahm-Phi-3-5-mini-instruct", - "name": "ahm-Phi-3-5-mini-instruct", - "display_name": "ahm-Phi-3-5-mini-instruct", + "id": "gpt-3.5-turbo", + "name": "gpt-3.5-turbo", + "display_name": "gpt-3.5-turbo", "limit": { "context": 8192, "output": 8192 @@ -84036,21 +95517,15 @@ "supported": false }, "cost": { - "input": 1, - "output": 3 + "input": 0.5, + "output": 1.5 }, "type": "chat" }, { - "id": "ahm-Phi-3-5-vision-instruct", - "name": "ahm-Phi-3-5-vision-instruct", - "display_name": "ahm-Phi-3-5-vision-instruct", - "modalities": { - "input": [ - "text", - "image" - ] - }, + "id": "gpt-3.5-turbo-0301", + "name": "gpt-3.5-turbo-0301", + "display_name": "gpt-3.5-turbo-0301", "limit": { "context": 8192, "output": 8192 @@ -84060,15 +95535,15 @@ "supported": false }, "cost": { - "input": 0.4, - "output": 1.6 + "input": 1.5, + "output": 1.5 }, "type": "chat" }, { - "id": "ahm-Phi-3-medium-128k", - "name": "ahm-Phi-3-medium-128k", - "display_name": "ahm-Phi-3-medium-128k", + "id": "gpt-3.5-turbo-0613", + "name": "gpt-3.5-turbo-0613", + "display_name": "gpt-3.5-turbo-0613", "limit": { "context": 8192, "output": 8192 @@ -84078,15 +95553,15 @@ "supported": false }, "cost": { - "input": 6, - "output": 18 + "input": 1.5, + "output": 2 }, "type": "chat" }, { - "id": "ahm-Phi-3-medium-4k", - "name": "ahm-Phi-3-medium-4k", - "display_name": "ahm-Phi-3-medium-4k", + "id": "gpt-3.5-turbo-1106", + "name": "gpt-3.5-turbo-1106", + "display_name": "gpt-3.5-turbo-1106", "limit": { "context": 8192, "output": 8192 @@ -84097,14 +95572,14 @@ }, "cost": { "input": 1, - "output": 3 + "output": 2 }, "type": "chat" }, { - "id": "ahm-Phi-3-small-128k", - "name": "ahm-Phi-3-small-128k", - "display_name": "ahm-Phi-3-small-128k", + "id": "gpt-3.5-turbo-16k", + "name": "gpt-3.5-turbo-16k", + "display_name": "gpt-3.5-turbo-16k", "limit": { "context": 8192, "output": 8192 @@ -84114,15 +95589,15 @@ "supported": false }, "cost": { - "input": 1, - "output": 3 + "input": 3, + "output": 4 }, "type": "chat" }, { - "id": "aihubmix-Codestral-2501", - "name": "aihubmix-Codestral-2501", - "display_name": "aihubmix-Codestral-2501", + "id": "gpt-3.5-turbo-16k-0613", + "name": "gpt-3.5-turbo-16k-0613", + "display_name": "gpt-3.5-turbo-16k-0613", "limit": { "context": 8192, "output": 8192 @@ -84132,20 +95607,15 @@ "supported": false }, "cost": { - "input": 0.4, - "output": 1.2 + "input": 3, + "output": 4 }, "type": "chat" }, { - "id": "aihubmix-Cohere-command-r", - "name": "aihubmix-Cohere-command-r", - "display_name": "aihubmix-Cohere-command-r", - "modalities": { - "input": [ - "text" - ] - }, + "id": "gpt-3.5-turbo-instruct", + "name": "gpt-3.5-turbo-instruct", + "display_name": "gpt-3.5-turbo-instruct", "limit": { "context": 8192, "output": 8192 @@ -84155,15 +95625,15 @@ "supported": false }, "cost": { - "input": 0.64, - "output": 1.92 + "input": 1.5, + "output": 2 }, "type": "chat" }, { - "id": "aihubmix-Jamba-1-5-Large", - "name": "aihubmix-Jamba-1-5-Large", - "display_name": "aihubmix-Jamba-1-5-Large", + "id": "gpt-4", + "name": "gpt-4", + "display_name": "gpt-4", "limit": { "context": 8192, "output": 8192 @@ -84173,15 +95643,15 @@ "supported": false }, "cost": { - "input": 2.2, - "output": 8.8 + "input": 30, + "output": 60 }, "type": "chat" }, { - "id": "aihubmix-Llama-3-1-405B-Instruct", - "name": "aihubmix-Llama-3-1-405B-Instruct", - "display_name": "aihubmix-Llama-3-1-405B-Instruct", + "id": "gpt-4-0125-preview", + "name": "gpt-4-0125-preview", + "display_name": "gpt-4-0125-preview", "limit": { "context": 8192, "output": 8192 @@ -84191,15 +95661,15 @@ "supported": false }, "cost": { - "input": 5, - "output": 15 + "input": 10, + "output": 30 }, "type": "chat" }, { - "id": "aihubmix-Llama-3-1-70B-Instruct", - "name": "aihubmix-Llama-3-1-70B-Instruct", - "display_name": "aihubmix-Llama-3-1-70B-Instruct", + "id": "gpt-4-0314", + "name": "gpt-4-0314", + "display_name": "gpt-4-0314", "limit": { "context": 8192, "output": 8192 @@ -84209,15 +95679,15 @@ "supported": false }, "cost": { - "input": 0.6, - "output": 0.78 + "input": 30, + "output": 60 }, "type": "chat" }, { - "id": "aihubmix-Llama-3-1-8B-Instruct", - "name": "aihubmix-Llama-3-1-8B-Instruct", - "display_name": "aihubmix-Llama-3-1-8B-Instruct", + "id": "gpt-4-0613", + "name": "gpt-4-0613", + "display_name": "gpt-4-0613", "limit": { "context": 8192, "output": 8192 @@ -84227,15 +95697,15 @@ "supported": false }, "cost": { - "input": 0.3, - "output": 0.6 + "input": 30, + "output": 60 }, "type": "chat" }, { - "id": "aihubmix-Llama-3-2-11B-Vision", - "name": "aihubmix-Llama-3-2-11B-Vision", - "display_name": "aihubmix-Llama-3-2-11B-Vision", + "id": "gpt-4-1106-preview", + "name": "gpt-4-1106-preview", + "display_name": "gpt-4-1106-preview", "limit": { "context": 8192, "output": 8192 @@ -84245,15 +95715,15 @@ "supported": false }, "cost": { - "input": 0.4, - "output": 0.4 + "input": 10, + "output": 30 }, "type": "chat" }, { - "id": "aihubmix-Llama-3-2-90B-Vision", - "name": "aihubmix-Llama-3-2-90B-Vision", - "display_name": "aihubmix-Llama-3-2-90B-Vision", + "id": "gpt-4-32k-0314", + "name": "gpt-4-32k-0314", + "display_name": "gpt-4-32k-0314", "limit": { "context": 8192, "output": 8192 @@ -84263,15 +95733,15 @@ "supported": false }, "cost": { - "input": 2.4, - "output": 2.4 + "input": 60, + "output": 120 }, "type": "chat" }, { - "id": "aihubmix-Llama-3-70B-Instruct", - "name": "aihubmix-Llama-3-70B-Instruct", - "display_name": "aihubmix-Llama-3-70B-Instruct", + "id": "gpt-4-32k-0613", + "name": "gpt-4-32k-0613", + "display_name": "gpt-4-32k-0613", "limit": { "context": 8192, "output": 8192 @@ -84281,15 +95751,15 @@ "supported": false }, "cost": { - "input": 0.7, - "output": 0.7 + "input": 60, + "output": 120 }, "type": "chat" }, { - "id": "aihubmix-Mistral-large", - "name": "aihubmix-Mistral-large", - "display_name": "aihubmix-Mistral-large", + "id": "gpt-4-turbo", + "name": "gpt-4-turbo", + "display_name": "gpt-4-turbo", "limit": { "context": 8192, "output": 8192 @@ -84299,20 +95769,15 @@ "supported": false }, "cost": { - "input": 4, - "output": 12 + "input": 10, + "output": 30 }, "type": "chat" }, { - "id": "aihubmix-command-r-08-2024", - "name": "aihubmix-command-r-08-2024", - "display_name": "aihubmix-command-r-08-2024", - "modalities": { - "input": [ - "text" - ] - }, + "id": "gpt-4-turbo-2024-04-09", + "name": "gpt-4-turbo-2024-04-09", + "display_name": "gpt-4-turbo-2024-04-09", "limit": { "context": 8192, "output": 8192 @@ -84322,20 +95787,15 @@ "supported": false }, "cost": { - "input": 0.2, - "output": 0.8 + "input": 10, + "output": 30 }, "type": "chat" }, { - "id": "aihubmix-command-r-plus", - "name": "aihubmix-command-r-plus", - "display_name": "aihubmix-command-r-plus", - "modalities": { - "input": [ - "text" - ] - }, + "id": "gpt-4-turbo-preview", + "name": "gpt-4-turbo-preview", + "display_name": "gpt-4-turbo-preview", "limit": { "context": 8192, "output": 8192 @@ -84345,20 +95805,15 @@ "supported": false }, "cost": { - "input": 3.84, - "output": 19.2 + "input": 10, + "output": 30 }, "type": "chat" }, { - "id": "aihubmix-command-r-plus-08-2024", - "name": "aihubmix-command-r-plus-08-2024", - "display_name": "aihubmix-command-r-plus-08-2024", - "modalities": { - "input": [ - "text" - ] - }, + "id": "gpt-4-vision-preview", + "name": "gpt-4-vision-preview", + "display_name": "gpt-4-vision-preview", "limit": { "context": 8192, "output": 8192 @@ -84368,33 +95823,40 @@ "supported": false }, "cost": { - "input": 2.8, - "output": 11.2 + "input": 10, + "output": 30 }, "type": "chat" }, { - "id": "azure-deepseek-v3.2", - "name": "azure-deepseek-v3.2", - "display_name": "azure-deepseek-v3.2", + "id": "gpt-4o-2024-05-13", + "name": "gpt-4o-2024-05-13", + "display_name": "gpt-4o-2024-05-13", "limit": { - "context": 8192, - "output": 8192 + "context": 128000, + "output": 128000 }, "tool_call": false, "reasoning": { "supported": false }, "cost": { - "input": 0.58, - "output": 1.680028 + "input": 5, + "output": 15, + "cache_read": 5 }, "type": "chat" }, { - "id": "azure-deepseek-v3.2-speciale", - "name": "azure-deepseek-v3.2-speciale", - "display_name": "azure-deepseek-v3.2-speciale", + "id": "gpt-4o-mini-2024-07-18", + "name": "gpt-4o-mini-2024-07-18", + "display_name": "gpt-4o-mini-2024-07-18", + "modalities": { + "input": [ + "text", + "image" + ] + }, "limit": { "context": 8192, "output": 8192 @@ -84404,62 +95866,70 @@ "supported": false }, "cost": { - "input": 0.58, - "output": 1.680028 + "input": 0.15, + "output": 0.6, + "cache_read": 0.075 }, "type": "chat" }, { - "id": "baidu-deepseek-v3.2", - "name": "baidu-deepseek-v3.2", - "display_name": "baidu-deepseek-v3.2", + "id": "gpt-oss-20b", + "name": "gpt-oss-20b", + "display_name": "gpt-oss-20b", "modalities": { "input": [ "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 128000, + "output": 128000 }, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "cost": { - "input": 0.274, - "output": 0.411 + "input": 0.11, + "output": 0.55 }, "type": "chat" }, { - "id": "baidu-deepseek-v3.2-exp", - "name": "baidu-deepseek-v3.2-exp", - "display_name": "baidu-deepseek-v3.2-exp", + "id": "grok-2-vision-1212", + "name": "grok-2-vision-1212", + "display_name": "grok-2-vision-1212", "modalities": { "input": [ - "text" + "text", + "image" ] }, "limit": { "context": 8192, "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "cost": { - "input": 0.274, - "output": 0.411, - "cache_read": 0.0274 + "input": 1.8, + "output": 9 }, "type": "chat" }, { - "id": "cerebras-llama-3.3-70b", - "name": "cerebras-llama-3.3-70b", - "display_name": "cerebras-llama-3.3-70b", + "id": "grok-vision-beta", + "name": "grok-vision-beta", + "display_name": "grok-vision-beta", + "modalities": { + "input": [ + "text", + "image" + ] + }, "limit": { "context": 8192, "output": 8192 @@ -84469,15 +95939,15 @@ "supported": false }, "cost": { - "input": 0.6, - "output": 0.6 + "input": 5.6, + "output": 16.8 }, "type": "chat" }, { - "id": "chatglm_lite", - "name": "chatglm_lite", - "display_name": "chatglm_lite", + "id": "groq-llama-3.1-8b-instant", + "name": "groq-llama-3.1-8b-instant", + "display_name": "groq-llama-3.1-8b-instant", "limit": { "context": 8192, "output": 8192 @@ -84487,15 +95957,15 @@ "supported": false }, "cost": { - "input": 0.2858, - "output": 0.2858 + "input": 0.055, + "output": 0.088 }, "type": "chat" }, { - "id": "chatglm_pro", - "name": "chatglm_pro", - "display_name": "chatglm_pro", + "id": "groq-llama-3.3-70b-versatile", + "name": "groq-llama-3.3-70b-versatile", + "display_name": "groq-llama-3.3-70b-versatile", "limit": { "context": 8192, "output": 8192 @@ -84505,15 +95975,15 @@ "supported": false }, "cost": { - "input": 1.4286, - "output": 1.4286 + "input": 0.649, + "output": 0.869011 }, "type": "chat" }, { - "id": "chatglm_std", - "name": "chatglm_std", - "display_name": "chatglm_std", + "id": "groq-llama-4-maverick-17b-128e-instruct", + "name": "groq-llama-4-maverick-17b-128e-instruct", + "display_name": "groq-llama-4-maverick-17b-128e-instruct", "limit": { "context": 8192, "output": 8192 @@ -84523,15 +95993,15 @@ "supported": false }, "cost": { - "input": 0.7144, - "output": 0.7144 + "input": 0.22, + "output": 0.66 }, "type": "chat" }, { - "id": "chatglm_turbo", - "name": "chatglm_turbo", - "display_name": "chatglm_turbo", + "id": "groq-llama-4-scout-17b-16e-instruct", + "name": "groq-llama-4-scout-17b-16e-instruct", + "display_name": "groq-llama-4-scout-17b-16e-instruct", "limit": { "context": 8192, "output": 8192 @@ -84541,15 +96011,21 @@ "supported": false }, "cost": { - "input": 0.7144, - "output": 0.7144 + "input": 0.122, + "output": 0.366 }, "type": "chat" }, { - "id": "claude-2", - "name": "claude-2", - "display_name": "claude-2", + "id": "imagen-4.0-generate-preview-05-20", + "name": "imagen-4.0-generate-preview-05-20", + "display_name": "imagen-4.0-generate-preview-05-20", + "modalities": { + "input": [ + "text", + "image" + ] + }, "limit": { "context": 8192, "output": 8192 @@ -84559,15 +96035,21 @@ "supported": false }, "cost": { - "input": 8.8, - "output": 8.8 + "input": 2, + "output": 2, + "cache_read": 0 }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "claude-2.0", - "name": "claude-2.0", - "display_name": "claude-2.0", + "id": "jina-embeddings-v2-base-code", + "name": "jina-embeddings-v2-base-code", + "display_name": "jina-embeddings-v2-base-code", + "modalities": { + "input": [ + "text" + ] + }, "limit": { "context": 8192, "output": 8192 @@ -84577,15 +96059,15 @@ "supported": false }, "cost": { - "input": 8.8, - "output": 39.6 + "input": 0.05, + "output": 0.05 }, - "type": "chat" + "type": "embedding" }, { - "id": "claude-2.1", - "name": "claude-2.1", - "display_name": "claude-2.1", + "id": "learnlm-1.5-pro-experimental", + "name": "learnlm-1.5-pro-experimental", + "display_name": "learnlm-1.5-pro-experimental", "limit": { "context": 8192, "output": 8192 @@ -84595,45 +96077,33 @@ "supported": false }, "cost": { - "input": 8.8, - "output": 39.6 + "input": 1.25, + "output": 5 }, "type": "chat" }, { - "id": "claude-3-5-sonnet-20240620", - "name": "claude-3-5-sonnet-20240620", - "display_name": "claude-3-5-sonnet-20240620", - "modalities": { - "input": [ - "text", - "image" - ] - }, + "id": "llama-3.1-405b-instruct", + "name": "llama-3.1-405b-instruct", + "display_name": "llama-3.1-405b-instruct", "limit": { - "context": 200000, - "output": 200000 + "context": 8192, + "output": 8192 }, "tool_call": false, "reasoning": { "supported": false }, "cost": { - "input": 3.3, - "output": 16.5 + "input": 4, + "output": 4 }, "type": "chat" }, { - "id": "claude-3-haiku-20240229", - "name": "claude-3-haiku-20240229", - "display_name": "claude-3-haiku-20240229", - "modalities": { - "input": [ - "text", - "image" - ] - }, + "id": "llama-3.1-405b-reasoning", + "name": "llama-3.1-405b-reasoning", + "display_name": "llama-3.1-405b-reasoning", "limit": { "context": 8192, "output": 8192 @@ -84643,21 +96113,15 @@ "supported": false }, "cost": { - "input": 0.275, - "output": 0.275 + "input": 4, + "output": 4 }, "type": "chat" }, { - "id": "claude-3-haiku-20240307", - "name": "claude-3-haiku-20240307", - "display_name": "claude-3-haiku-20240307", - "modalities": { - "input": [ - "text", - "image" - ] - }, + "id": "llama-3.1-70b-versatile", + "name": "llama-3.1-70b-versatile", + "display_name": "llama-3.1-70b-versatile", "limit": { "context": 8192, "output": 8192 @@ -84667,21 +96131,15 @@ "supported": false }, "cost": { - "input": 0.275, - "output": 1.375 + "input": 0.6, + "output": 0.6 }, "type": "chat" }, { - "id": "claude-3-sonnet-20240229", - "name": "claude-3-sonnet-20240229", - "display_name": "claude-3-sonnet-20240229", - "modalities": { - "input": [ - "text", - "image" - ] - }, + "id": "llama-3.1-8b-instant", + "name": "llama-3.1-8b-instant", + "display_name": "llama-3.1-8b-instant", "limit": { "context": 8192, "output": 8192 @@ -84691,15 +96149,15 @@ "supported": false }, "cost": { - "input": 3.3, - "output": 16.5 + "input": 0.3, + "output": 0.6 }, "type": "chat" }, { - "id": "claude-instant-1", - "name": "claude-instant-1", - "display_name": "claude-instant-1", + "id": "llama-3.1-sonar-small-128k-online", + "name": "llama-3.1-sonar-small-128k-online", + "display_name": "llama-3.1-sonar-small-128k-online", "limit": { "context": 8192, "output": 8192 @@ -84709,15 +96167,15 @@ "supported": false }, "cost": { - "input": 1.793, - "output": 1.793 + "input": 0.3, + "output": 0.3 }, "type": "chat" }, { - "id": "claude-instant-1.2", - "name": "claude-instant-1.2", - "display_name": "claude-instant-1.2", + "id": "llama-3.2-11b-vision-preview", + "name": "llama-3.2-11b-vision-preview", + "display_name": "llama-3.2-11b-vision-preview", "limit": { "context": 8192, "output": 8192 @@ -84727,15 +96185,15 @@ "supported": false }, "cost": { - "input": 0.88, - "output": 3.96 + "input": 0.2, + "output": 0.2 }, "type": "chat" }, { - "id": "code-davinci-edit-001", - "name": "code-davinci-edit-001", - "display_name": "code-davinci-edit-001", + "id": "llama-3.2-1b-preview", + "name": "llama-3.2-1b-preview", + "display_name": "llama-3.2-1b-preview", "limit": { "context": 8192, "output": 8192 @@ -84745,15 +96203,15 @@ "supported": false }, "cost": { - "input": 20, - "output": 20 + "input": 0.2, + "output": 0.2 }, "type": "chat" }, { - "id": "cogview-3", - "name": "cogview-3", - "display_name": "cogview-3", + "id": "llama-3.2-3b-preview", + "name": "llama-3.2-3b-preview", + "display_name": "llama-3.2-3b-preview", "limit": { "context": 8192, "output": 8192 @@ -84763,15 +96221,15 @@ "supported": false }, "cost": { - "input": 35.5, - "output": 35.5 + "input": 0.2, + "output": 0.2 }, "type": "chat" }, { - "id": "cogview-3-plus", - "name": "cogview-3-plus", - "display_name": "cogview-3-plus", + "id": "llama-3.2-90b-vision-preview", + "name": "llama-3.2-90b-vision-preview", + "display_name": "llama-3.2-90b-vision-preview", "limit": { "context": 8192, "output": 8192 @@ -84781,20 +96239,15 @@ "supported": false }, "cost": { - "input": 10, - "output": 10 + "input": 2.4, + "output": 2.4 }, "type": "chat" }, { - "id": "command", - "name": "command", - "display_name": "command", - "modalities": { - "input": [ - "text" - ] - }, + "id": "llama2-70b-4096", + "name": "llama2-70b-4096", + "display_name": "llama2-70b-4096", "limit": { "context": 8192, "output": 8192 @@ -84804,15 +96257,15 @@ "supported": false }, "cost": { - "input": 1, - "output": 2 + "input": 0.5, + "output": 0.5 }, "type": "chat" }, { - "id": "command-light", - "name": "command-light", - "display_name": "command-light", + "id": "llama2-70b-40960", + "name": "llama2-70b-40960", + "display_name": "llama2-70b-40960", "limit": { "context": 8192, "output": 8192 @@ -84822,15 +96275,15 @@ "supported": false }, "cost": { - "input": 1, - "output": 2 + "input": 0.5, + "output": 0.5 }, "type": "chat" }, { - "id": "command-light-nightly", - "name": "command-light-nightly", - "display_name": "command-light-nightly", + "id": "llama2-7b-2048", + "name": "llama2-7b-2048", + "display_name": "llama2-7b-2048", "limit": { "context": 8192, "output": 8192 @@ -84840,15 +96293,15 @@ "supported": false }, "cost": { - "input": 1, - "output": 2 + "input": 0.1, + "output": 0.1 }, "type": "chat" }, { - "id": "command-nightly", - "name": "command-nightly", - "display_name": "command-nightly", + "id": "llama3-70b-8192", + "name": "llama3-70b-8192", + "display_name": "llama3-70b-8192", "limit": { "context": 8192, "output": 8192 @@ -84858,20 +96311,15 @@ "supported": false }, "cost": { - "input": 1, - "output": 2 + "input": 0.7, + "output": 0.937288 }, "type": "chat" }, { - "id": "command-r", - "name": "command-r", - "display_name": "command-r", - "modalities": { - "input": [ - "text" - ] - }, + "id": "llama3-8b-8192", + "name": "llama3-8b-8192", + "display_name": "llama3-8b-8192", "limit": { "context": 8192, "output": 8192 @@ -84881,20 +96329,15 @@ "supported": false }, "cost": { - "input": 0.64, - "output": 1.92 + "input": 0.06, + "output": 0.12 }, "type": "chat" }, { - "id": "command-r-08-2024", - "name": "command-r-08-2024", - "display_name": "command-r-08-2024", - "modalities": { - "input": [ - "text" - ] - }, + "id": "llama3-groq-70b-8192-tool-use-preview", + "name": "llama3-groq-70b-8192-tool-use-preview", + "display_name": "llama3-groq-70b-8192-tool-use-preview", "limit": { "context": 8192, "output": 8192 @@ -84904,20 +96347,15 @@ "supported": false }, "cost": { - "input": 0.2, - "output": 0.8 + "input": 0.00089, + "output": 0.00089 }, "type": "chat" }, { - "id": "command-r-plus", - "name": "command-r-plus", - "display_name": "command-r-plus", - "modalities": { - "input": [ - "text" - ] - }, + "id": "llama3-groq-8b-8192-tool-use-preview", + "name": "llama3-groq-8b-8192-tool-use-preview", + "display_name": "llama3-groq-8b-8192-tool-use-preview", "limit": { "context": 8192, "output": 8192 @@ -84927,20 +96365,15 @@ "supported": false }, "cost": { - "input": 3.84, - "output": 19.2 + "input": 0.00019, + "output": 0.00019 }, "type": "chat" }, { - "id": "command-r-plus-08-2024", - "name": "command-r-plus-08-2024", - "display_name": "command-r-plus-08-2024", - "modalities": { - "input": [ - "text" - ] - }, + "id": "meta-llama/Llama-3.2-90B-Vision-Instruct", + "name": "meta-llama/Llama-3.2-90B-Vision-Instruct", + "display_name": "meta-llama/Llama-3.2-90B-Vision-Instruct", "limit": { "context": 8192, "output": 8192 @@ -84950,21 +96383,15 @@ "supported": false }, "cost": { - "input": 2.8, - "output": 11.2 + "input": 0.5, + "output": 0.5 }, "type": "chat" }, { - "id": "dall-e-2", - "name": "dall-e-2", - "display_name": "dall-e-2", - "modalities": { - "input": [ - "text", - "image" - ] - }, + "id": "meta-llama/llama-3.1-405b-instruct:free", + "name": "meta-llama/llama-3.1-405b-instruct:free", + "display_name": "meta-llama/llama-3.1-405b-instruct:free", "limit": { "context": 8192, "output": 8192 @@ -84974,15 +96401,15 @@ "supported": false }, "cost": { - "input": 16, - "output": 16 + "input": 0.02, + "output": 0.02 }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "davinci", - "name": "davinci", - "display_name": "davinci", + "id": "meta-llama/llama-3.1-70b-instruct:free", + "name": "meta-llama/llama-3.1-70b-instruct:free", + "display_name": "meta-llama/llama-3.1-70b-instruct:free", "limit": { "context": 8192, "output": 8192 @@ -84992,15 +96419,15 @@ "supported": false }, "cost": { - "input": 20, - "output": 20 + "input": 0.02, + "output": 0.02 }, "type": "chat" }, { - "id": "davinci-002", - "name": "davinci-002", - "display_name": "davinci-002", + "id": "meta-llama/llama-3.1-8b-instruct:free", + "name": "meta-llama/llama-3.1-8b-instruct:free", + "display_name": "meta-llama/llama-3.1-8b-instruct:free", "limit": { "context": 8192, "output": 8192 @@ -85010,15 +96437,15 @@ "supported": false }, "cost": { - "input": 2, - "output": 2 + "input": 0.02, + "output": 0.02 }, "type": "chat" }, { - "id": "deepinfra-llama-3.1-8b-instant", - "name": "deepinfra-llama-3.1-8b-instant", - "display_name": "deepinfra-llama-3.1-8b-instant", + "id": "meta-llama/llama-3.2-11b-vision-instruct:free", + "name": "meta-llama/llama-3.2-11b-vision-instruct:free", + "display_name": "meta-llama/llama-3.2-11b-vision-instruct:free", "limit": { "context": 8192, "output": 8192 @@ -85028,15 +96455,15 @@ "supported": false }, "cost": { - "input": 0.033, - "output": 0.054978 + "input": 0.02, + "output": 0.02 }, "type": "chat" }, { - "id": "deepinfra-llama-3.3-70b-instant-turbo", - "name": "deepinfra-llama-3.3-70b-instant-turbo", - "display_name": "deepinfra-llama-3.3-70b-instant-turbo", + "id": "meta-llama/llama-3.2-3b-instruct:free", + "name": "meta-llama/llama-3.2-3b-instruct:free", + "display_name": "meta-llama/llama-3.2-3b-instruct:free", "limit": { "context": 8192, "output": 8192 @@ -85046,15 +96473,15 @@ "supported": false }, "cost": { - "input": 0.11, - "output": 0.352 + "input": 0.02, + "output": 0.02 }, "type": "chat" }, { - "id": "deepinfra-llama-4-maverick-17b-128e-instruct", - "name": "deepinfra-llama-4-maverick-17b-128e-instruct", - "display_name": "deepinfra-llama-4-maverick-17b-128e-instruct", + "id": "meta/llama-3.1-405b-instruct", + "name": "meta/llama-3.1-405b-instruct", + "display_name": "meta/llama-3.1-405b-instruct", "limit": { "context": 8192, "output": 8192 @@ -85064,15 +96491,15 @@ "supported": false }, "cost": { - "input": 1.65, - "output": 6.6 + "input": 5, + "output": 5 }, "type": "chat" }, { - "id": "deepinfra-llama-4-scout-17b-16e-instruct", - "name": "deepinfra-llama-4-scout-17b-16e-instruct", - "display_name": "deepinfra-llama-4-scout-17b-16e-instruct", + "id": "meta/llama3-8B-chat", + "name": "meta/llama3-8B-chat", + "display_name": "meta/llama3-8B-chat", "limit": { "context": 8192, "output": 8192 @@ -85082,16 +96509,15 @@ "supported": false }, "cost": { - "input": 0.088, - "output": 0.33, - "cache_read": 0 + "input": 0.3, + "output": 0.3 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-Coder-V2-Instruct", - "name": "deepseek-ai/DeepSeek-Coder-V2-Instruct", - "display_name": "deepseek-ai/DeepSeek-Coder-V2-Instruct", + "id": "Baichuan3-Turbo", + "name": "Baichuan3-Turbo", + "display_name": "Baichuan3-Turbo", "limit": { "context": 8192, "output": 8192 @@ -85101,15 +96527,15 @@ "supported": false }, "cost": { - "input": 0.16, - "output": 0.32 + "input": 1.9, + "output": 1.9 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-R1-Distill-Llama-70B", - "name": "deepseek-ai/DeepSeek-R1-Distill-Llama-70B", - "display_name": "deepseek-ai/DeepSeek-R1-Distill-Llama-70B", + "id": "Baichuan3-Turbo-128k", + "name": "Baichuan3-Turbo-128k", + "display_name": "Baichuan3-Turbo-128k", "limit": { "context": 8192, "output": 8192 @@ -85119,15 +96545,15 @@ "supported": false }, "cost": { - "input": 0.6, - "output": 0.6 + "input": 3.8, + "output": 3.8 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-R1-Distill-Llama-8B", - "name": "deepseek-ai/DeepSeek-R1-Distill-Llama-8B", - "display_name": "deepseek-ai/DeepSeek-R1-Distill-Llama-8B", + "id": "Baichuan4", + "name": "Baichuan4", + "display_name": "Baichuan4", "limit": { "context": 8192, "output": 8192 @@ -85137,15 +96563,15 @@ "supported": false }, "cost": { - "input": 0.01, - "output": 0.01 + "input": 16, + "output": 16 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B", - "name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B", - "display_name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B", + "id": "Baichuan4-Air", + "name": "Baichuan4-Air", + "display_name": "Baichuan4-Air", "limit": { "context": 8192, "output": 8192 @@ -85155,15 +96581,15 @@ "supported": false }, "cost": { - "input": 0.01, - "output": 0.01 + "input": 0.16, + "output": 0.16 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-R1-Distill-Qwen-14B", - "name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-14B", - "display_name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-14B", + "id": "Baichuan4-Turbo", + "name": "Baichuan4-Turbo", + "display_name": "Baichuan4-Turbo", "limit": { "context": 8192, "output": 8192 @@ -85173,15 +96599,15 @@ "supported": false }, "cost": { - "input": 0.1, - "output": 0.1 + "input": 2.4, + "output": 2.4 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-R1-Distill-Qwen-32B", - "name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-32B", - "display_name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-32B", + "id": "DeepSeek-v3", + "name": "DeepSeek-v3", + "display_name": "DeepSeek-v3", "limit": { "context": 8192, "output": 8192 @@ -85191,15 +96617,15 @@ "supported": false }, "cost": { - "input": 0.2, - "output": 0.2 + "input": 0.272, + "output": 1.088 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-R1-Distill-Qwen-7B", - "name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-7B", - "display_name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-7B", + "id": "Doubao-1.5-lite-32k", + "name": "Doubao-1.5-lite-32k", + "display_name": "Doubao-1.5-lite-32k", "limit": { "context": 8192, "output": 8192 @@ -85209,15 +96635,16 @@ "supported": false }, "cost": { - "input": 0.01, - "output": 0.01 + "input": 0.05, + "output": 0.1, + "cache_read": 0.01 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V2-Chat", - "name": "deepseek-ai/DeepSeek-V2-Chat", - "display_name": "deepseek-ai/DeepSeek-V2-Chat", + "id": "Doubao-1.5-pro-256k", + "name": "Doubao-1.5-pro-256k", + "display_name": "Doubao-1.5-pro-256k", "limit": { "context": 8192, "output": 8192 @@ -85227,15 +96654,16 @@ "supported": false }, "cost": { - "input": 0.16, - "output": 0.32 + "input": 0.8, + "output": 1.44, + "cache_read": 0.8 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V2.5", - "name": "deepseek-ai/DeepSeek-V2.5", - "display_name": "deepseek-ai/DeepSeek-V2.5", + "id": "Doubao-1.5-pro-32k", + "name": "Doubao-1.5-pro-32k", + "display_name": "Doubao-1.5-pro-32k", "limit": { "context": 8192, "output": 8192 @@ -85245,15 +96673,16 @@ "supported": false }, "cost": { - "input": 0.16, - "output": 0.32 + "input": 0.134, + "output": 0.335, + "cache_read": 0.0268 }, "type": "chat" }, { - "id": "deepseek-ai/deepseek-llm-67b-chat", - "name": "deepseek-ai/deepseek-llm-67b-chat", - "display_name": "deepseek-ai/deepseek-llm-67b-chat", + "id": "Doubao-1.5-vision-pro-32k", + "name": "Doubao-1.5-vision-pro-32k", + "display_name": "Doubao-1.5-vision-pro-32k", "limit": { "context": 8192, "output": 8192 @@ -85263,15 +96692,15 @@ "supported": false }, "cost": { - "input": 0.16, - "output": 0.16 + "input": 0.46, + "output": 1.38 }, "type": "chat" }, { - "id": "deepseek-ai/deepseek-vl2", - "name": "deepseek-ai/deepseek-vl2", - "display_name": "deepseek-ai/deepseek-vl2", + "id": "Doubao-lite-128k", + "name": "Doubao-lite-128k", + "display_name": "Doubao-lite-128k", "limit": { "context": 8192, "output": 8192 @@ -85281,15 +96710,16 @@ "supported": false }, "cost": { - "input": 0.16, - "output": 0.16 + "input": 0.14, + "output": 0.28, + "cache_read": 0.14 }, "type": "chat" }, { - "id": "deepseek-v3", - "name": "deepseek-v3", - "display_name": "deepseek-v3", + "id": "Doubao-lite-32k", + "name": "Doubao-lite-32k", + "display_name": "Doubao-lite-32k", "limit": { "context": 8192, "output": 8192 @@ -85299,21 +96729,16 @@ "supported": false }, "cost": { - "input": 0.272, - "output": 1.088, - "cache_read": 0 + "input": 0.06, + "output": 0.12, + "cache_read": 0.012 }, "type": "chat" }, { - "id": "distil-whisper-large-v3-en", - "name": "distil-whisper-large-v3-en", - "display_name": "distil-whisper-large-v3-en", - "modalities": { - "input": [ - "audio" - ] - }, + "id": "Doubao-lite-4k", + "name": "Doubao-lite-4k", + "display_name": "Doubao-lite-4k", "limit": { "context": 8192, "output": 8192 @@ -85323,15 +96748,16 @@ "supported": false }, "cost": { - "input": 5.556, - "output": 5.556 + "input": 0.06, + "output": 0.12, + "cache_read": 0.06 }, "type": "chat" }, { - "id": "doubao-1-5-thinking-vision-pro-250428", - "name": "doubao-1-5-thinking-vision-pro-250428", - "display_name": "doubao-1-5-thinking-vision-pro-250428", + "id": "Doubao-pro-128k", + "name": "Doubao-pro-128k", + "display_name": "Doubao-pro-128k", "limit": { "context": 8192, "output": 8192 @@ -85341,16 +96767,15 @@ "supported": false }, "cost": { - "input": 2, - "output": 2, - "cache_read": 2 + "input": 0.8, + "output": 1.44 }, "type": "chat" }, { - "id": "aistudio_gemini-2.0-flash", - "name": "aistudio_gemini-2.0-flash", - "display_name": "aistudio_gemini-2.0-flash", + "id": "Doubao-pro-256k", + "name": "Doubao-pro-256k", + "display_name": "Doubao-pro-256k", "limit": { "context": 8192, "output": 8192 @@ -85360,16 +96785,16 @@ "supported": false }, "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.25 + "input": 0.8, + "output": 1.44, + "cache_read": 0.8 }, "type": "chat" }, { - "id": "aistudio_gpt-4.1-mini", - "name": "aistudio_gpt-4.1-mini", - "display_name": "aistudio_gpt-4.1-mini", + "id": "Doubao-pro-32k", + "name": "Doubao-pro-32k", + "display_name": "Doubao-pro-32k", "limit": { "context": 8192, "output": 8192 @@ -85379,16 +96804,16 @@ "supported": false }, "cost": { - "input": 0.4, - "output": 1.6, - "cache_read": 0.1 + "input": 0.14, + "output": 0.35, + "cache_read": 0.028 }, "type": "chat" }, { - "id": "deepseek-r1-distill-qianfan-llama-8b", - "name": "deepseek-r1-distill-qianfan-llama-8b", - "display_name": "deepseek-r1-distill-qianfan-llama-8b", + "id": "Doubao-pro-4k", + "name": "Doubao-pro-4k", + "display_name": "Doubao-pro-4k", "limit": { "context": 8192, "output": 8192 @@ -85398,15 +96823,15 @@ "supported": false }, "cost": { - "input": 0.137, - "output": 0.548 + "input": 0.14, + "output": 0.35 }, "type": "chat" }, { - "id": "doubao-1-5-pro-256k-250115", - "name": "doubao-1-5-pro-256k-250115", - "display_name": "doubao-1-5-pro-256k-250115", + "id": "GPT-OSS-20B", + "name": "GPT-OSS-20B", + "display_name": "GPT-OSS-20B", "limit": { "context": 8192, "output": 8192 @@ -85416,15 +96841,15 @@ "supported": false }, "cost": { - "input": 0.684, - "output": 1.2312 + "input": 0.11, + "output": 0.55 }, "type": "chat" }, { - "id": "doubao-1-5-pro-32k-250115", - "name": "doubao-1-5-pro-32k-250115", - "display_name": "doubao-1-5-pro-32k-250115", + "id": "Gryphe/MythoMax-L2-13b", + "name": "Gryphe/MythoMax-L2-13b", + "display_name": "Gryphe/MythoMax-L2-13b", "limit": { "context": 8192, "output": 8192 @@ -85434,15 +96859,20 @@ "supported": false }, "cost": { - "input": 0.108, - "output": 0.27 + "input": 0.4, + "output": 0.4 }, "type": "chat" }, { - "id": "gpt-4o-2024-08-06-global", - "name": "gpt-4o-2024-08-06-global", - "display_name": "gpt-4o-2024-08-06-global", + "id": "MiniMax-Text-01", + "name": "MiniMax-Text-01", + "display_name": "MiniMax-Text-01", + "modalities": { + "input": [ + "text" + ] + }, "limit": { "context": 8192, "output": 8192 @@ -85452,16 +96882,15 @@ "supported": false }, "cost": { - "input": 2.5, - "output": 10, - "cache_read": 1.25 + "input": 0.14, + "output": 1.12 }, "type": "chat" }, { - "id": "gpt-4o-mini-global", - "name": "gpt-4o-mini-global", - "display_name": "gpt-4o-mini-global", + "id": "Mistral-large-2407", + "name": "Mistral-large-2407", + "display_name": "Mistral-large-2407", "limit": { "context": 8192, "output": 8192 @@ -85471,16 +96900,15 @@ "supported": false }, "cost": { - "input": 0.15, - "output": 0.6, - "cache_read": 0.075 + "input": 3, + "output": 9 }, "type": "chat" }, { - "id": "meta-llama-3-70b", - "name": "meta-llama-3-70b", - "display_name": "meta-llama-3-70b", + "id": "Qwen/Qwen2-1.5B-Instruct", + "name": "Qwen/Qwen2-1.5B-Instruct", + "display_name": "Qwen/Qwen2-1.5B-Instruct", "limit": { "context": 8192, "output": 8192 @@ -85490,15 +96918,15 @@ "supported": false }, "cost": { - "input": 4.795, - "output": 4.795 + "input": 0.2, + "output": 0.2 }, "type": "chat" }, { - "id": "meta-llama-3-8b", - "name": "meta-llama-3-8b", - "display_name": "meta-llama-3-8b", + "id": "Qwen/Qwen2-57B-A14B-Instruct", + "name": "Qwen/Qwen2-57B-A14B-Instruct", + "display_name": "Qwen/Qwen2-57B-A14B-Instruct", "limit": { "context": 8192, "output": 8192 @@ -85508,15 +96936,15 @@ "supported": false }, "cost": { - "input": 0.548, - "output": 0.548 + "input": 0.24, + "output": 0.24 }, "type": "chat" }, { - "id": "o3-global", - "name": "o3-global", - "display_name": "o3-global", + "id": "Qwen/Qwen2-72B-Instruct", + "name": "Qwen/Qwen2-72B-Instruct", + "display_name": "Qwen/Qwen2-72B-Instruct", "limit": { "context": 8192, "output": 8192 @@ -85526,16 +96954,15 @@ "supported": false }, "cost": { - "input": 2, - "output": 8, - "cache_read": 0.5 + "input": 0.8, + "output": 0.8 }, "type": "chat" }, { - "id": "o3-mini-global", - "name": "o3-mini-global", - "display_name": "o3-mini-global", + "id": "Qwen/Qwen2-7B-Instruct", + "name": "Qwen/Qwen2-7B-Instruct", + "display_name": "Qwen/Qwen2-7B-Instruct", "limit": { "context": 8192, "output": 8192 @@ -85545,16 +96972,15 @@ "supported": false }, "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.55 + "input": 0.08, + "output": 0.08 }, "type": "chat" }, { - "id": "o3-pro-global", - "name": "o3-pro-global", - "display_name": "o3-pro-global", + "id": "Qwen/Qwen2.5-32B-Instruct", + "name": "Qwen/Qwen2.5-32B-Instruct", + "display_name": "Qwen/Qwen2.5-32B-Instruct", "limit": { "context": 8192, "output": 8192 @@ -85564,15 +96990,15 @@ "supported": false }, "cost": { - "input": 20, - "output": 80 + "input": 0.6, + "output": 0.6 }, "type": "chat" }, { - "id": "qianfan-chinese-llama-2-13b", - "name": "qianfan-chinese-llama-2-13b", - "display_name": "qianfan-chinese-llama-2-13b", + "id": "Qwen/Qwen2.5-72B-Instruct", + "name": "Qwen/Qwen2.5-72B-Instruct", + "display_name": "Qwen/Qwen2.5-72B-Instruct", "limit": { "context": 8192, "output": 8192 @@ -85582,15 +97008,15 @@ "supported": false }, "cost": { - "input": 0.822, - "output": 0.822 + "input": 0.8, + "output": 0.8 }, "type": "chat" }, { - "id": "qianfan-llama-vl-8b", - "name": "qianfan-llama-vl-8b", - "display_name": "qianfan-llama-vl-8b", + "id": "Qwen/Qwen2.5-72B-Instruct-128K", + "name": "Qwen/Qwen2.5-72B-Instruct-128K", + "display_name": "Qwen/Qwen2.5-72B-Instruct-128K", "limit": { "context": 8192, "output": 8192 @@ -85600,2115 +97026,1713 @@ "supported": false }, "cost": { - "input": 0.274, - "output": 0.685 + "input": 0.8, + "output": 0.8 }, "type": "chat" - } - ] - }, - "openrouter": { - "id": "openrouter", - "name": "OpenRouter", - "display_name": "OpenRouter", - "models": [ + }, { - "id": "ai21/jamba-large-1.7", - "name": "AI21: Jamba Large 1.7", - "display_name": "AI21: Jamba Large 1.7", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, + "id": "Qwen/Qwen2.5-7B-Instruct", + "name": "Qwen/Qwen2.5-7B-Instruct", + "display_name": "Qwen/Qwen2.5-7B-Instruct", "limit": { - "context": 256000, - "output": 4096 + "context": 8192, + "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, + "cost": { + "input": 0.4, + "output": 0.4 + }, "type": "chat" }, { - "id": "ai21/jamba-mini-1.7", - "name": "AI21: Jamba Mini 1.7", - "display_name": "AI21: Jamba Mini 1.7", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, + "id": "Qwen/Qwen2.5-Coder-32B-Instruct", + "name": "Qwen/Qwen2.5-Coder-32B-Instruct", + "display_name": "Qwen/Qwen2.5-Coder-32B-Instruct", "limit": { - "context": 256000, - "output": 4096 + "context": 8192, + "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, + "cost": { + "input": 0.16, + "output": 0.16 + }, "type": "chat" }, { - "id": "aion-labs/aion-1.0", - "name": "AionLabs: Aion-1.0", - "display_name": "AionLabs: Aion-1.0", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, + "id": "Qwen3-235B-A22B-Thinking-2507", + "name": "Qwen3-235B-A22B-Thinking-2507", + "display_name": "Qwen3-235B-A22B-Thinking-2507", "limit": { - "context": 131072, - "output": 32768 + "context": 8192, + "output": 8192 }, "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false + }, + "cost": { + "input": 0.28, + "output": 2.8 }, "type": "chat" }, { - "id": "aion-labs/aion-1.0-mini", - "name": "AionLabs: Aion-1.0-Mini", - "display_name": "AionLabs: Aion-1.0-Mini", + "id": "Stable-Diffusion-3-5-Large", + "name": "Stable-Diffusion-3-5-Large", + "display_name": "Stable-Diffusion-3-5-Large", "modalities": { "input": [ - "text" - ], - "output": [ - "text" + "text", + "image" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 8192, + "output": 8192 }, "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "type": "chat" + "cost": { + "input": 4, + "output": 4, + "cache_read": 0 + }, + "type": "imageGeneration" }, { - "id": "aion-labs/aion-rp-llama-3.1-8b", - "name": "AionLabs: Aion-RP 1.0 (8B)", - "display_name": "AionLabs: Aion-RP 1.0 (8B)", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, + "id": "WizardLM/WizardCoder-Python-34B-V1.0", + "name": "WizardLM/WizardCoder-Python-34B-V1.0", + "display_name": "WizardLM/WizardCoder-Python-34B-V1.0", "limit": { - "context": 32768, - "output": 32768 + "context": 8192, + "output": 8192 }, "tool_call": false, "reasoning": { "supported": false }, + "cost": { + "input": 0.9, + "output": 0.9 + }, "type": "chat" }, { - "id": "alfredpros/codellama-7b-instruct-solidity", - "name": "AlfredPros: CodeLLaMa 7B Instruct Solidity", - "display_name": "AlfredPros: CodeLLaMa 7B Instruct Solidity", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, + "id": "ahm-Phi-3-5-MoE-instruct", + "name": "ahm-Phi-3-5-MoE-instruct", + "display_name": "ahm-Phi-3-5-MoE-instruct", "limit": { - "context": 4096, - "output": 4096 + "context": 8192, + "output": 8192 }, "tool_call": false, "reasoning": { "supported": false }, + "cost": { + "input": 0.4, + "output": 1.6 + }, "type": "chat" }, { - "id": "alibaba/tongyi-deepresearch-30b-a3b", - "name": "Tongyi DeepResearch 30B A3B", - "display_name": "Tongyi DeepResearch 30B A3B", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, + "id": "ahm-Phi-3-5-mini-instruct", + "name": "ahm-Phi-3-5-mini-instruct", + "display_name": "ahm-Phi-3-5-mini-instruct", "limit": { - "context": 131072, - "output": 131072 + "context": 8192, + "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false + }, + "cost": { + "input": 1, + "output": 3 }, "type": "chat" }, { - "id": "allenai/olmo-2-0325-32b-instruct", - "name": "AllenAI: Olmo 2 32B Instruct", - "display_name": "AllenAI: Olmo 2 32B Instruct", + "id": "ahm-Phi-3-5-vision-instruct", + "name": "ahm-Phi-3-5-vision-instruct", + "display_name": "ahm-Phi-3-5-vision-instruct", "modalities": { "input": [ - "text" - ], - "output": [ - "text" + "text", + "image" ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 8192, + "output": 8192 }, "tool_call": false, "reasoning": { "supported": false }, + "cost": { + "input": 0.4, + "output": 1.6 + }, "type": "chat" }, { - "id": "allenai/olmo-3-32b-think", - "name": "AllenAI: Olmo 3 32B Think", - "display_name": "AllenAI: Olmo 3 32B Think", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, + "id": "ahm-Phi-3-medium-128k", + "name": "ahm-Phi-3-medium-128k", + "display_name": "ahm-Phi-3-medium-128k", "limit": { - "context": 65536, - "output": 65536 + "context": 8192, + "output": 8192 }, - "temperature": true, "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false + }, + "cost": { + "input": 6, + "output": 18 }, "type": "chat" }, { - "id": "allenai/olmo-3-7b-instruct", - "name": "AllenAI: Olmo 3 7B Instruct", - "display_name": "AllenAI: Olmo 3 7B Instruct", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, + "id": "ahm-Phi-3-medium-4k", + "name": "ahm-Phi-3-medium-4k", + "display_name": "ahm-Phi-3-medium-4k", "limit": { - "context": 65536, - "output": 65536 + "context": 8192, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, + "cost": { + "input": 1, + "output": 3 + }, "type": "chat" }, { - "id": "allenai/olmo-3-7b-think", - "name": "AllenAI: Olmo 3 7B Think", - "display_name": "AllenAI: Olmo 3 7B Think", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, + "id": "ahm-Phi-3-small-128k", + "name": "ahm-Phi-3-small-128k", + "display_name": "ahm-Phi-3-small-128k", "limit": { - "context": 65536, - "output": 65536 + "context": 8192, + "output": 8192 }, - "temperature": true, "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false + }, + "cost": { + "input": 1, + "output": 3 }, "type": "chat" }, { - "id": "allenai/olmo-3.1-32b-instruct", - "name": "AllenAI: Olmo 3.1 32B Instruct", - "display_name": "AllenAI: Olmo 3.1 32B Instruct", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, + "id": "aihubmix-Codestral-2501", + "name": "aihubmix-Codestral-2501", + "display_name": "aihubmix-Codestral-2501", "limit": { - "context": 65536, - "output": 65536 + "context": 8192, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, + "cost": { + "input": 0.4, + "output": 1.2 + }, "type": "chat" }, { - "id": "allenai/olmo-3.1-32b-think", - "name": "AllenAI: Olmo 3.1 32B Think", - "display_name": "AllenAI: Olmo 3.1 32B Think", + "id": "aihubmix-Cohere-command-r", + "name": "aihubmix-Cohere-command-r", + "display_name": "aihubmix-Cohere-command-r", "modalities": { "input": [ "text" - ], - "output": [ - "text" ] }, "limit": { - "context": 65536, - "output": 65536 + "context": 8192, + "output": 8192 }, - "temperature": true, "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false + }, + "cost": { + "input": 0.64, + "output": 1.92 }, "type": "chat" }, { - "id": "alpindale/goliath-120b", - "name": "Goliath 120B", - "display_name": "Goliath 120B", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, + "id": "aihubmix-Jamba-1-5-Large", + "name": "aihubmix-Jamba-1-5-Large", + "display_name": "aihubmix-Jamba-1-5-Large", "limit": { - "context": 6144, - "output": 1024 + "context": 8192, + "output": 8192 }, "tool_call": false, "reasoning": { "supported": false }, + "cost": { + "input": 2.2, + "output": 8.8 + }, "type": "chat" }, { - "id": "amazon/nova-2-lite-v1", - "name": "Amazon: Nova 2 Lite", - "display_name": "Amazon: Nova 2 Lite", - "modalities": { - "input": [ - "text", - "image", - "video" - ], - "output": [ - "text" - ] - }, + "id": "aihubmix-Llama-3-1-405B-Instruct", + "name": "aihubmix-Llama-3-1-405B-Instruct", + "display_name": "aihubmix-Llama-3-1-405B-Instruct", "limit": { - "context": 1000000, - "output": 65535 + "context": 8192, + "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "type": "imageGeneration" + "cost": { + "input": 5, + "output": 15 + }, + "type": "chat" }, { - "id": "amazon/nova-lite-v1", - "name": "Amazon: Nova Lite 1.0", - "display_name": "Amazon: Nova Lite 1.0", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, + "id": "aihubmix-Llama-3-1-70B-Instruct", + "name": "aihubmix-Llama-3-1-70B-Instruct", + "display_name": "aihubmix-Llama-3-1-70B-Instruct", "limit": { - "context": 300000, - "output": 5120 + "context": 8192, + "output": 8192 }, "tool_call": false, "reasoning": { "supported": false }, - "type": "imageGeneration" + "cost": { + "input": 0.6, + "output": 0.78 + }, + "type": "chat" }, { - "id": "amazon/nova-micro-v1", - "name": "Amazon: Nova Micro 1.0", - "display_name": "Amazon: Nova Micro 1.0", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, + "id": "aihubmix-Llama-3-1-8B-Instruct", + "name": "aihubmix-Llama-3-1-8B-Instruct", + "display_name": "aihubmix-Llama-3-1-8B-Instruct", "limit": { - "context": 128000, - "output": 5120 + "context": 8192, + "output": 8192 }, "tool_call": false, "reasoning": { "supported": false }, + "cost": { + "input": 0.3, + "output": 0.6 + }, "type": "chat" }, { - "id": "amazon/nova-premier-v1", - "name": "Amazon: Nova Premier 1.0", - "display_name": "Amazon: Nova Premier 1.0", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, + "id": "aihubmix-Llama-3-2-11B-Vision", + "name": "aihubmix-Llama-3-2-11B-Vision", + "display_name": "aihubmix-Llama-3-2-11B-Vision", "limit": { - "context": 1000000, - "output": 32000 + "context": 8192, + "output": 8192 }, "tool_call": false, "reasoning": { "supported": false }, - "type": "imageGeneration" + "cost": { + "input": 0.4, + "output": 0.4 + }, + "type": "chat" }, { - "id": "amazon/nova-pro-v1", - "name": "Amazon: Nova Pro 1.0", - "display_name": "Amazon: Nova Pro 1.0", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, + "id": "aihubmix-Llama-3-2-90B-Vision", + "name": "aihubmix-Llama-3-2-90B-Vision", + "display_name": "aihubmix-Llama-3-2-90B-Vision", "limit": { - "context": 300000, - "output": 5120 + "context": 8192, + "output": 8192 }, "tool_call": false, "reasoning": { "supported": false }, - "type": "imageGeneration" + "cost": { + "input": 2.4, + "output": 2.4 + }, + "type": "chat" }, { - "id": "anthracite-org/magnum-v4-72b", - "name": "Magnum v4 72B", - "display_name": "Magnum v4 72B", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, + "id": "aihubmix-Llama-3-70B-Instruct", + "name": "aihubmix-Llama-3-70B-Instruct", + "display_name": "aihubmix-Llama-3-70B-Instruct", "limit": { - "context": 16384, - "output": 2048 + "context": 8192, + "output": 8192 }, "tool_call": false, "reasoning": { "supported": false }, + "cost": { + "input": 0.7, + "output": 0.7 + }, "type": "chat" }, { - "id": "anthropic/claude-3-haiku", - "name": "Anthropic: Claude 3 Haiku", - "display_name": "Anthropic: Claude 3 Haiku", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, + "id": "aihubmix-Mistral-large", + "name": "aihubmix-Mistral-large", + "display_name": "aihubmix-Mistral-large", "limit": { - "context": 200000, - "output": 4096 + "context": 8192, + "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "type": "imageGeneration" + "cost": { + "input": 4, + "output": 12 + }, + "type": "chat" }, { - "id": "anthropic/claude-3.5-haiku", - "name": "Anthropic: Claude 3.5 Haiku", - "display_name": "Anthropic: Claude 3.5 Haiku", + "id": "aihubmix-command-r-08-2024", + "name": "aihubmix-command-r-08-2024", + "display_name": "aihubmix-command-r-08-2024", "modalities": { "input": [ - "text", - "image" - ], - "output": [ "text" ] }, "limit": { - "context": 200000, + "context": 8192, "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "type": "imageGeneration" + "cost": { + "input": 0.2, + "output": 0.8 + }, + "type": "chat" }, { - "id": "anthropic/claude-3.5-haiku-20241022", - "name": "Anthropic: Claude 3.5 Haiku (2024-10-22)", - "display_name": "Anthropic: Claude 3.5 Haiku (2024-10-22)", + "id": "aihubmix-command-r-plus", + "name": "aihubmix-command-r-plus", + "display_name": "aihubmix-command-r-plus", "modalities": { "input": [ - "text", - "image" - ], - "output": [ "text" ] }, "limit": { - "context": 200000, + "context": 8192, "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, - "type": "imageGeneration" + "cost": { + "input": 3.84, + "output": 19.2 + }, + "type": "chat" }, { - "id": "anthropic/claude-3.5-sonnet", - "name": "Anthropic: Claude 3.5 Sonnet", - "display_name": "Anthropic: Claude 3.5 Sonnet", + "id": "aihubmix-command-r-plus-08-2024", + "name": "aihubmix-command-r-plus-08-2024", + "display_name": "aihubmix-command-r-plus-08-2024", "modalities": { "input": [ - "text", - "image" - ], - "output": [ "text" ] }, "limit": { - "context": 200000, + "context": 8192, "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, - "type": "imageGeneration" + "cost": { + "input": 2.8, + "output": 11.2 + }, + "type": "chat" }, { - "id": "anthropic/claude-3.7-sonnet", - "name": "Anthropic: Claude 3.7 Sonnet", - "display_name": "Anthropic: Claude 3.7 Sonnet", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, + "id": "alicloud-deepseek-v3.2", + "name": "alicloud-deepseek-v3.2", + "display_name": "alicloud-deepseek-v3.2", "limit": { - "context": 200000, - "output": 64000 + "context": 8192, + "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "type": "imageGeneration" + "cost": { + "input": 0.274, + "output": 0.411, + "cache_read": 0.0548 + }, + "type": "chat" }, { - "id": "anthropic/claude-3.7-sonnet:thinking", - "name": "Anthropic: Claude 3.7 Sonnet (thinking)", - "display_name": "Anthropic: Claude 3.7 Sonnet (thinking)", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, + "id": "alicloud-glm-4.6", + "name": "alicloud-glm-4.6", + "display_name": "alicloud-glm-4.6", "limit": { - "context": 200000, - "output": 64000 + "context": 8192, + "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "type": "imageGeneration" + "cost": { + "input": 0.41096, + "output": 1.917539, + "cache_read": 0.41096 + }, + "type": "chat" }, { - "id": "anthropic/claude-haiku-4.5", - "name": "Anthropic: Claude Haiku 4.5", - "display_name": "Anthropic: Claude Haiku 4.5", - "modalities": { - "input": [ - "image", - "text" - ], - "output": [ - "text" - ] - }, + "id": "alicloud-glm-4.7", + "name": "alicloud-glm-4.7", + "display_name": "alicloud-glm-4.7", "limit": { - "context": 200000, - "output": 64000 + "context": 8192, + "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "type": "imageGeneration" + "cost": { + "input": 0.41096, + "output": 1.917786, + "cache_read": 0.41096 + }, + "type": "chat" }, { - "id": "anthropic/claude-opus-4", - "name": "Anthropic: Claude Opus 4", - "display_name": "Anthropic: Claude Opus 4", - "modalities": { - "input": [ - "image", - "text" - ], - "output": [ - "text" - ] + "id": "alicloud-kimi-k2-instruct", + "name": "alicloud-kimi-k2-instruct", + "display_name": "alicloud-kimi-k2-instruct", + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "cost": { + "input": 0.548, + "output": 2.192 }, + "type": "chat" + }, + { + "id": "alicloud-kimi-k2-thinking", + "name": "alicloud-kimi-k2-thinking", + "display_name": "alicloud-kimi-k2-thinking", "limit": { - "context": 200000, - "output": 32000 + "context": 8192, + "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "type": "imageGeneration" + "cost": { + "input": 0.548, + "output": 2.192 + }, + "type": "chat" }, { - "id": "anthropic/claude-opus-4.1", - "name": "Anthropic: Claude Opus 4.1", - "display_name": "Anthropic: Claude Opus 4.1", - "modalities": { - "input": [ - "image", - "text" - ], - "output": [ - "text" - ] - }, + "id": "azure-deepseek-v3.2", + "name": "azure-deepseek-v3.2", + "display_name": "azure-deepseek-v3.2", "limit": { - "context": 200000, - "output": 200000 + "context": 8192, + "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "type": "imageGeneration" + "cost": { + "input": 0.58, + "output": 1.680028 + }, + "type": "chat" }, { - "id": "anthropic/claude-opus-4.5", - "name": "Anthropic: Claude Opus 4.5", - "display_name": "Anthropic: Claude Opus 4.5", - "modalities": { - "input": [ - "image", - "text" - ], - "output": [ - "text" - ] - }, + "id": "azure-deepseek-v3.2-speciale", + "name": "azure-deepseek-v3.2-speciale", + "display_name": "azure-deepseek-v3.2-speciale", "limit": { - "context": 200000, - "output": 32000 + "context": 8192, + "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "type": "imageGeneration" + "cost": { + "input": 0.58, + "output": 1.680028 + }, + "type": "chat" }, { - "id": "anthropic/claude-sonnet-4", - "name": "Anthropic: Claude Sonnet 4", - "display_name": "Anthropic: Claude Sonnet 4", + "id": "baidu-deepseek-v3.2", + "name": "baidu-deepseek-v3.2", + "display_name": "baidu-deepseek-v3.2", "modalities": { "input": [ - "image", - "text" - ], - "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 8192, + "output": 8192 }, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "type": "imageGeneration" + "cost": { + "input": 0.274, + "output": 0.411 + }, + "type": "chat" }, { - "id": "anthropic/claude-sonnet-4.5", - "name": "Anthropic: Claude Sonnet 4.5", - "display_name": "Anthropic: Claude Sonnet 4.5", + "id": "baidu-deepseek-v3.2-exp", + "name": "baidu-deepseek-v3.2-exp", + "display_name": "baidu-deepseek-v3.2-exp", "modalities": { "input": [ - "text", - "image" - ], - "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 8192, + "output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "type": "imageGeneration" + "cost": { + "input": 0.274, + "output": 0.411, + "cache_read": 0.0274 + }, + "type": "chat" }, { - "id": "arcee-ai/coder-large", - "name": "Arcee AI: Coder Large", - "display_name": "Arcee AI: Coder Large", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, + "id": "cbs-glm-4.7", + "name": "cbs-glm-4.7", + "display_name": "cbs-glm-4.7", "limit": { - "context": 32768, - "output": 32768 + "context": 8192, + "output": 8192 }, "tool_call": false, "reasoning": { "supported": false }, + "cost": { + "input": 2.25, + "output": 2.749995 + }, "type": "chat" }, { - "id": "arcee-ai/maestro-reasoning", - "name": "Arcee AI: Maestro Reasoning", - "display_name": "Arcee AI: Maestro Reasoning", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, + "id": "cerebras-llama-3.3-70b", + "name": "cerebras-llama-3.3-70b", + "display_name": "cerebras-llama-3.3-70b", "limit": { - "context": 131072, - "output": 32000 + "context": 8192, + "output": 8192 }, "tool_call": false, "reasoning": { "supported": false }, + "cost": { + "input": 0.6, + "output": 0.6 + }, "type": "chat" }, { - "id": "arcee-ai/spotlight", - "name": "Arcee AI: Spotlight", - "display_name": "Arcee AI: Spotlight", - "modalities": { - "input": [ - "image", - "text" - ], - "output": [ - "text" - ] - }, + "id": "chatglm_lite", + "name": "chatglm_lite", + "display_name": "chatglm_lite", "limit": { - "context": 131072, - "output": 65537 + "context": 8192, + "output": 8192 }, "tool_call": false, "reasoning": { "supported": false }, - "type": "imageGeneration" + "cost": { + "input": 0.2858, + "output": 0.2858 + }, + "type": "chat" }, { - "id": "arcee-ai/trinity-mini", - "name": "Arcee AI: Trinity Mini", - "display_name": "Arcee AI: Trinity Mini", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, + "id": "chatglm_pro", + "name": "chatglm_pro", + "display_name": "chatglm_pro", "limit": { - "context": 131072, - "output": 131072 + "context": 8192, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false + }, + "cost": { + "input": 1.4286, + "output": 1.4286 }, "type": "chat" }, { - "id": "arcee-ai/trinity-mini:free", - "name": "Arcee AI: Trinity Mini (free)", - "display_name": "Arcee AI: Trinity Mini (free)", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, + "id": "chatglm_std", + "name": "chatglm_std", + "display_name": "chatglm_std", "limit": { - "context": 131072, - "output": 131072 + "context": 8192, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false + }, + "cost": { + "input": 0.7144, + "output": 0.7144 }, "type": "chat" }, { - "id": "arcee-ai/virtuoso-large", - "name": "Arcee AI: Virtuoso Large", - "display_name": "Arcee AI: Virtuoso Large", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, + "id": "chatglm_turbo", + "name": "chatglm_turbo", + "display_name": "chatglm_turbo", "limit": { - "context": 131072, - "output": 64000 + "context": 8192, + "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, + "cost": { + "input": 0.7144, + "output": 0.7144 + }, "type": "chat" }, { - "id": "baidu/ernie-4.5-21b-a3b", - "name": "Baidu: ERNIE 4.5 21B A3B", - "display_name": "Baidu: ERNIE 4.5 21B A3B", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, + "id": "claude-2", + "name": "claude-2", + "display_name": "claude-2", "limit": { - "context": 120000, - "output": 8000 + "context": 8192, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, + "cost": { + "input": 8.8, + "output": 8.8 + }, "type": "chat" }, { - "id": "baidu/ernie-4.5-21b-a3b-thinking", - "name": "Baidu: ERNIE 4.5 21B A3B Thinking", - "display_name": "Baidu: ERNIE 4.5 21B A3B Thinking", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, + "id": "claude-2.0", + "name": "claude-2.0", + "display_name": "claude-2.0", "limit": { - "context": 131072, - "output": 65536 + "context": 8192, + "output": 8192 }, - "temperature": true, "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false + }, + "cost": { + "input": 8.8, + "output": 39.6 }, "type": "chat" }, { - "id": "baidu/ernie-4.5-300b-a47b", - "name": "Baidu: ERNIE 4.5 300B A47B", - "display_name": "Baidu: ERNIE 4.5 300B A47B", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, + "id": "claude-2.1", + "name": "claude-2.1", + "display_name": "claude-2.1", "limit": { - "context": 123000, - "output": 12000 + "context": 8192, + "output": 8192 }, "tool_call": false, "reasoning": { "supported": false }, + "cost": { + "input": 8.8, + "output": 39.6 + }, "type": "chat" }, { - "id": "baidu/ernie-4.5-vl-28b-a3b", - "name": "Baidu: ERNIE 4.5 VL 28B A3B", - "display_name": "Baidu: ERNIE 4.5 VL 28B A3B", + "id": "claude-3-5-sonnet-20240620", + "name": "claude-3-5-sonnet-20240620", + "display_name": "claude-3-5-sonnet-20240620", "modalities": { "input": [ "text", "image" - ], - "output": [ - "text" ] }, "limit": { - "context": 30000, - "output": 8000 + "context": 200000, + "output": 200000 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "type": "imageGeneration" + "cost": { + "input": 3.3, + "output": 16.5 + }, + "type": "chat" }, { - "id": "baidu/ernie-4.5-vl-424b-a47b", - "name": "Baidu: ERNIE 4.5 VL 424B A47B", - "display_name": "Baidu: ERNIE 4.5 VL 424B A47B", + "id": "claude-3-haiku-20240229", + "name": "claude-3-haiku-20240229", + "display_name": "claude-3-haiku-20240229", "modalities": { "input": [ - "image", - "text" - ], - "output": [ - "text" + "text", + "image" ] }, "limit": { - "context": 123000, - "output": 16000 + "context": 8192, + "output": 8192 }, "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "type": "imageGeneration" + "cost": { + "input": 0.275, + "output": 0.275 + }, + "type": "chat" }, { - "id": "bytedance-seed/seed-1.6", - "name": "ByteDance Seed: Seed 1.6", - "display_name": "ByteDance Seed: Seed 1.6", + "id": "claude-3-haiku-20240307", + "name": "claude-3-haiku-20240307", + "display_name": "claude-3-haiku-20240307", "modalities": { "input": [ - "image", "text", - "video" - ], - "output": [ - "text" + "image" ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 8192, + "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "type": "imageGeneration" + "cost": { + "input": 0.275, + "output": 1.375 + }, + "type": "chat" }, { - "id": "bytedance-seed/seed-1.6-flash", - "name": "ByteDance Seed: Seed 1.6 Flash", - "display_name": "ByteDance Seed: Seed 1.6 Flash", + "id": "claude-3-sonnet-20240229", + "name": "claude-3-sonnet-20240229", + "display_name": "claude-3-sonnet-20240229", "modalities": { "input": [ - "image", "text", - "video" - ], - "output": [ - "text" + "image" ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 8192, + "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "type": "imageGeneration" + "cost": { + "input": 3.3, + "output": 16.5 + }, + "type": "chat" }, { - "id": "bytedance/ui-tars-1.5-7b", - "name": "ByteDance: UI-TARS 7B", - "display_name": "ByteDance: UI-TARS 7B", - "modalities": { - "input": [ - "image", - "text" - ], - "output": [ - "text" - ] - }, + "id": "claude-instant-1", + "name": "claude-instant-1", + "display_name": "claude-instant-1", "limit": { - "context": 128000, - "output": 2048 + "context": 8192, + "output": 8192 }, "tool_call": false, "reasoning": { "supported": false }, - "type": "imageGeneration" + "cost": { + "input": 1.793, + "output": 1.793 + }, + "type": "chat" }, { - "id": "cognitivecomputations/dolphin-mistral-24b-venice-edition:free", - "name": "Venice: Uncensored (free)", - "display_name": "Venice: Uncensored (free)", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, + "id": "claude-instant-1.2", + "name": "claude-instant-1.2", + "display_name": "claude-instant-1.2", "limit": { - "context": 32768, - "output": 32768 + "context": 8192, + "output": 8192 }, "tool_call": false, "reasoning": { "supported": false }, - "type": "chat" - }, - { - "id": "cohere/command-a", - "name": "Cohere: Command A", - "display_name": "Cohere: Command A", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] + "cost": { + "input": 0.88, + "output": 3.96 }, + "type": "chat" + }, + { + "id": "code-davinci-edit-001", + "name": "code-davinci-edit-001", + "display_name": "code-davinci-edit-001", "limit": { - "context": 256000, + "context": 8192, "output": 8192 }, "tool_call": false, "reasoning": { "supported": false }, + "cost": { + "input": 20, + "output": 20 + }, "type": "chat" }, { - "id": "cohere/command-r-08-2024", - "name": "Cohere: Command R (08-2024)", - "display_name": "Cohere: Command R (08-2024)", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, + "id": "cogview-3", + "name": "cogview-3", + "display_name": "cogview-3", "limit": { - "context": 128000, - "output": 4000 + "context": 8192, + "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, + "cost": { + "input": 35.5, + "output": 35.5 + }, "type": "chat" }, { - "id": "cohere/command-r-plus-08-2024", - "name": "Cohere: Command R+ (08-2024)", - "display_name": "Cohere: Command R+ (08-2024)", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, + "id": "cogview-3-plus", + "name": "cogview-3-plus", + "display_name": "cogview-3-plus", "limit": { - "context": 128000, - "output": 4000 + "context": 8192, + "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, + "cost": { + "input": 10, + "output": 10 + }, "type": "chat" }, { - "id": "cohere/command-r7b-12-2024", - "name": "Cohere: Command R7B (12-2024)", - "display_name": "Cohere: Command R7B (12-2024)", + "id": "command", + "name": "command", + "display_name": "command", "modalities": { "input": [ "text" - ], - "output": [ - "text" ] }, "limit": { - "context": 128000, - "output": 4000 + "context": 8192, + "output": 8192 }, "tool_call": false, "reasoning": { "supported": false }, + "cost": { + "input": 1, + "output": 2 + }, "type": "chat" }, { - "id": "deepcogito/cogito-v2-preview-llama-109b-moe", - "name": "Cogito V2 Preview Llama 109B", - "display_name": "Cogito V2 Preview Llama 109B", - "modalities": { - "input": [ - "image", - "text" - ], - "output": [ - "text" - ] - }, + "id": "command-light", + "name": "command-light", + "display_name": "command-light", "limit": { - "context": 32767, - "output": 32767 + "context": 8192, + "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "type": "imageGeneration" - }, - { - "id": "deepcogito/cogito-v2-preview-llama-405b", - "name": "Deep Cogito: Cogito V2 Preview Llama 405B", - "display_name": "Deep Cogito: Cogito V2 Preview Llama 405B", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 32768, - "output": 32768 + "supported": false }, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true + "cost": { + "input": 1, + "output": 2 }, "type": "chat" }, { - "id": "deepcogito/cogito-v2-preview-llama-70b", - "name": "Deep Cogito: Cogito V2 Preview Llama 70B", - "display_name": "Deep Cogito: Cogito V2 Preview Llama 70B", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, + "id": "command-light-nightly", + "name": "command-light-nightly", + "display_name": "command-light-nightly", "limit": { - "context": 32768, - "output": 32768 + "context": 8192, + "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false + }, + "cost": { + "input": 1, + "output": 2 }, "type": "chat" }, { - "id": "deepcogito/cogito-v2.1-671b", - "name": "Deep Cogito: Cogito v2.1 671B", - "display_name": "Deep Cogito: Cogito v2.1 671B", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, + "id": "command-nightly", + "name": "command-nightly", + "display_name": "command-nightly", "limit": { - "context": 128000, - "output": 128000 + "context": 8192, + "output": 8192 }, "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false + }, + "cost": { + "input": 1, + "output": 2 }, "type": "chat" }, { - "id": "deepseek/deepseek-chat", - "name": "DeepSeek: DeepSeek V3", - "display_name": "DeepSeek: DeepSeek V3", + "id": "command-r", + "name": "command-r", + "display_name": "command-r", "modalities": { "input": [ "text" - ], - "output": [ - "text" ] }, "limit": { - "context": 163840, - "output": 163840 + "context": 8192, + "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, + "cost": { + "input": 0.64, + "output": 1.92 + }, "type": "chat" }, { - "id": "deepseek/deepseek-chat-v3-0324", - "name": "DeepSeek: DeepSeek V3 0324", - "display_name": "DeepSeek: DeepSeek V3 0324", + "id": "command-r-08-2024", + "name": "command-r-08-2024", + "display_name": "command-r-08-2024", "modalities": { "input": [ "text" - ], - "output": [ - "text" ] }, "limit": { - "context": 163840, - "output": 65536 + "context": 8192, + "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false + }, + "cost": { + "input": 0.2, + "output": 0.8 }, "type": "chat" }, { - "id": "deepseek/deepseek-chat-v3.1", - "name": "DeepSeek: DeepSeek V3.1", - "display_name": "DeepSeek: DeepSeek V3.1", + "id": "command-r-plus", + "name": "command-r-plus", + "display_name": "command-r-plus", "modalities": { "input": [ "text" - ], - "output": [ - "text" ] }, "limit": { - "context": 32768, - "output": 7168 + "context": 8192, + "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false + }, + "cost": { + "input": 3.84, + "output": 19.2 }, "type": "chat" }, { - "id": "deepseek/deepseek-prover-v2", - "name": "DeepSeek: DeepSeek Prover V2", - "display_name": "DeepSeek: DeepSeek Prover V2", + "id": "command-r-plus-08-2024", + "name": "command-r-plus-08-2024", + "display_name": "command-r-plus-08-2024", "modalities": { "input": [ "text" - ], - "output": [ - "text" ] }, "limit": { - "context": 163840, - "output": 163840 + "context": 8192, + "output": 8192 }, "tool_call": false, "reasoning": { "supported": false }, + "cost": { + "input": 2.8, + "output": 11.2 + }, "type": "chat" }, { - "id": "deepseek/deepseek-r1", - "name": "DeepSeek: R1", - "display_name": "DeepSeek: R1", + "id": "dall-e-2", + "name": "dall-e-2", + "display_name": "dall-e-2", "modalities": { "input": [ - "text" - ], - "output": [ - "text" + "text", + "image" ] }, "limit": { - "context": 163840, - "output": 163840 + "context": 8192, + "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "type": "chat" + "cost": { + "input": 16, + "output": 16 + }, + "type": "imageGeneration" }, { - "id": "deepseek/deepseek-r1-0528", - "name": "DeepSeek: R1 0528", - "display_name": "DeepSeek: R1 0528", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, + "id": "davinci", + "name": "davinci", + "display_name": "davinci", "limit": { - "context": 163840, - "output": 65536 + "context": 8192, + "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false + }, + "cost": { + "input": 20, + "output": 20 }, "type": "chat" }, { - "id": "deepseek/deepseek-r1-0528-qwen3-8b", - "name": "DeepSeek: DeepSeek R1 0528 Qwen3 8B", - "display_name": "DeepSeek: DeepSeek R1 0528 Qwen3 8B", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, + "id": "davinci-002", + "name": "davinci-002", + "display_name": "davinci-002", "limit": { - "context": 128000, - "output": 32000 + "context": 8192, + "output": 8192 }, "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false + }, + "cost": { + "input": 2, + "output": 2 }, "type": "chat" }, { - "id": "deepseek/deepseek-r1-0528:free", - "name": "DeepSeek: R1 0528 (free)", - "display_name": "DeepSeek: R1 0528 (free)", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, + "id": "deepinfra-llama-3.1-8b-instant", + "name": "deepinfra-llama-3.1-8b-instant", + "display_name": "deepinfra-llama-3.1-8b-instant", "limit": { - "context": 163840, - "output": 163840 + "context": 8192, + "output": 8192 }, "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false + }, + "cost": { + "input": 0.033, + "output": 0.054978 }, "type": "chat" }, { - "id": "deepseek/deepseek-r1-distill-llama-70b", - "name": "DeepSeek: R1 Distill Llama 70B", - "display_name": "DeepSeek: R1 Distill Llama 70B", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, + "id": "deepinfra-llama-3.3-70b-instant-turbo", + "name": "deepinfra-llama-3.3-70b-instant-turbo", + "display_name": "deepinfra-llama-3.3-70b-instant-turbo", "limit": { - "context": 131072, - "output": 131072 + "context": 8192, + "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false + }, + "cost": { + "input": 0.11, + "output": 0.352 }, "type": "chat" }, { - "id": "deepseek/deepseek-r1-distill-qwen-14b", - "name": "DeepSeek: R1 Distill Qwen 14B", - "display_name": "DeepSeek: R1 Distill Qwen 14B", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, + "id": "deepinfra-llama-4-maverick-17b-128e-instruct", + "name": "deepinfra-llama-4-maverick-17b-128e-instruct", + "display_name": "deepinfra-llama-4-maverick-17b-128e-instruct", "limit": { - "context": 32768, - "output": 16384 + "context": 8192, + "output": 8192 }, "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false + }, + "cost": { + "input": 1.65, + "output": 6.6 }, "type": "chat" }, { - "id": "deepseek/deepseek-r1-distill-qwen-32b", - "name": "DeepSeek: R1 Distill Qwen 32B", - "display_name": "DeepSeek: R1 Distill Qwen 32B", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, + "id": "deepinfra-llama-4-scout-17b-16e-instruct", + "name": "deepinfra-llama-4-scout-17b-16e-instruct", + "display_name": "deepinfra-llama-4-scout-17b-16e-instruct", "limit": { - "context": 131072, - "output": 131072 + "context": 8192, + "output": 8192 }, "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false + }, + "cost": { + "input": 0.088, + "output": 0.33, + "cache_read": 0 }, "type": "chat" }, { - "id": "deepseek/deepseek-v3.1-terminus", - "name": "DeepSeek: DeepSeek V3.1 Terminus", - "display_name": "DeepSeek: DeepSeek V3.1 Terminus", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, + "id": "deepseek-ai/DeepSeek-Coder-V2-Instruct", + "name": "deepseek-ai/DeepSeek-Coder-V2-Instruct", + "display_name": "deepseek-ai/DeepSeek-Coder-V2-Instruct", "limit": { - "context": 163840, - "output": 163840 + "context": 8192, + "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false + }, + "cost": { + "input": 0.16, + "output": 0.32 }, "type": "chat" }, { - "id": "deepseek/deepseek-v3.1-terminus:exacto", - "name": "DeepSeek: DeepSeek V3.1 Terminus (exacto)", - "display_name": "DeepSeek: DeepSeek V3.1 Terminus (exacto)", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, + "id": "deepseek-ai/DeepSeek-R1-Distill-Llama-70B", + "name": "deepseek-ai/DeepSeek-R1-Distill-Llama-70B", + "display_name": "deepseek-ai/DeepSeek-R1-Distill-Llama-70B", "limit": { - "context": 163840, - "output": 163840 + "context": 8192, + "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false + }, + "cost": { + "input": 0.6, + "output": 0.6 }, "type": "chat" }, { - "id": "deepseek/deepseek-v3.2", - "name": "DeepSeek: DeepSeek V3.2", - "display_name": "DeepSeek: DeepSeek V3.2", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, + "id": "deepseek-ai/DeepSeek-R1-Distill-Llama-8B", + "name": "deepseek-ai/DeepSeek-R1-Distill-Llama-8B", + "display_name": "deepseek-ai/DeepSeek-R1-Distill-Llama-8B", "limit": { - "context": 163840, - "output": 65536 + "context": 8192, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "type": "chat" - }, - { - "id": "deepseek/deepseek-v3.2-exp", - "name": "DeepSeek: DeepSeek V3.2 Exp", - "display_name": "DeepSeek: DeepSeek V3.2 Exp", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] + "cost": { + "input": 0.01, + "output": 0.01 }, + "type": "chat" + }, + { + "id": "deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B", + "name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B", + "display_name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B", "limit": { - "context": 163840, - "output": 65536 + "context": 8192, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false + }, + "cost": { + "input": 0.01, + "output": 0.01 }, "type": "chat" }, { - "id": "deepseek/deepseek-v3.2-speciale", - "name": "DeepSeek: DeepSeek V3.2 Speciale", - "display_name": "DeepSeek: DeepSeek V3.2 Speciale", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, + "id": "deepseek-ai/DeepSeek-R1-Distill-Qwen-14B", + "name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-14B", + "display_name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-14B", "limit": { - "context": 163840, - "output": 65536 + "context": 8192, + "output": 8192 }, - "temperature": true, "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false + }, + "cost": { + "input": 0.1, + "output": 0.1 }, "type": "chat" }, { - "id": "eleutherai/llemma_7b", - "name": "EleutherAI: Llemma 7b", - "display_name": "EleutherAI: Llemma 7b", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, + "id": "deepseek-ai/DeepSeek-R1-Distill-Qwen-32B", + "name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-32B", + "display_name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-32B", "limit": { - "context": 4096, - "output": 4096 + "context": 8192, + "output": 8192 }, "tool_call": false, "reasoning": { "supported": false }, + "cost": { + "input": 0.2, + "output": 0.2 + }, "type": "chat" }, { - "id": "essentialai/rnj-1-instruct", - "name": "EssentialAI: Rnj 1 Instruct", - "display_name": "EssentialAI: Rnj 1 Instruct", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, + "id": "deepseek-ai/DeepSeek-R1-Distill-Qwen-7B", + "name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-7B", + "display_name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-7B", "limit": { - "context": 32768, - "output": 32768 + "context": 8192, + "output": 8192 }, "tool_call": false, "reasoning": { "supported": false }, + "cost": { + "input": 0.01, + "output": 0.01 + }, "type": "chat" }, { - "id": "google/gemini-2.0-flash-001", - "name": "Google: Gemini 2.0 Flash", - "display_name": "Google: Gemini 2.0 Flash", - "modalities": { - "input": [ - "text", - "image", - "audio", - "video" - ], - "output": [ - "text" - ] - }, + "id": "deepseek-ai/DeepSeek-V2-Chat", + "name": "deepseek-ai/DeepSeek-V2-Chat", + "display_name": "deepseek-ai/DeepSeek-V2-Chat", "limit": { - "context": 1048576, + "context": 8192, "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, - "type": "imageGeneration" + "cost": { + "input": 0.16, + "output": 0.32 + }, + "type": "chat" }, { - "id": "google/gemini-2.0-flash-exp:free", - "name": "Google: Gemini 2.0 Flash Experimental (free)", - "display_name": "Google: Gemini 2.0 Flash Experimental (free)", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, + "id": "deepseek-ai/DeepSeek-V2.5", + "name": "deepseek-ai/DeepSeek-V2.5", + "display_name": "deepseek-ai/DeepSeek-V2.5", "limit": { - "context": 1048576, + "context": 8192, "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "type": "imageGeneration" + "cost": { + "input": 0.16, + "output": 0.32 + }, + "type": "chat" }, { - "id": "google/gemini-2.0-flash-lite-001", - "name": "Google: Gemini 2.0 Flash Lite", - "display_name": "Google: Gemini 2.0 Flash Lite", - "modalities": { - "input": [ - "text", - "image", - "audio", - "video" - ], - "output": [ - "text" - ] - }, + "id": "deepseek-ai/deepseek-llm-67b-chat", + "name": "deepseek-ai/deepseek-llm-67b-chat", + "display_name": "deepseek-ai/deepseek-llm-67b-chat", "limit": { - "context": 1048576, + "context": 8192, "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, - "type": "imageGeneration" + "cost": { + "input": 0.16, + "output": 0.16 + }, + "type": "chat" }, { - "id": "google/gemini-2.5-flash", - "name": "Google: Gemini 2.5 Flash", - "display_name": "Google: Gemini 2.5 Flash", - "modalities": { - "input": [ - "image", - "text", - "audio", - "video" - ], - "output": [ - "text" - ] - }, + "id": "deepseek-ai/deepseek-vl2", + "name": "deepseek-ai/deepseek-vl2", + "display_name": "deepseek-ai/deepseek-vl2", "limit": { - "context": 1048576, - "output": 65535 + "context": 8192, + "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "type": "imageGeneration" + "cost": { + "input": 0.16, + "output": 0.16 + }, + "type": "chat" }, { - "id": "google/gemini-2.5-flash-image", - "name": "Google: Gemini 2.5 Flash Image (Nano Banana)", - "display_name": "Google: Gemini 2.5 Flash Image (Nano Banana)", - "modalities": { - "input": [ - "image", - "text" - ], - "output": [ - "image", - "text" - ] - }, + "id": "deepseek-v3", + "name": "deepseek-v3", + "display_name": "deepseek-v3", "limit": { - "context": 32768, - "output": 32768 + "context": 8192, + "output": 8192 }, "tool_call": false, "reasoning": { "supported": false }, - "type": "imageGeneration" + "cost": { + "input": 0.272, + "output": 1.088, + "cache_read": 0 + }, + "type": "chat" }, { - "id": "google/gemini-2.5-flash-image-preview", - "name": "Google: Gemini 2.5 Flash Image Preview (Nano Banana)", - "display_name": "Google: Gemini 2.5 Flash Image Preview (Nano Banana)", + "id": "distil-whisper-large-v3-en", + "name": "distil-whisper-large-v3-en", + "display_name": "distil-whisper-large-v3-en", "modalities": { "input": [ - "image", - "text" - ], - "output": [ - "image", - "text" + "audio" ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 8192, + "output": 8192 }, "tool_call": false, "reasoning": { "supported": false }, - "type": "imageGeneration" + "cost": { + "input": 5.556, + "output": 5.556 + }, + "type": "chat" }, { - "id": "google/gemini-2.5-flash-lite", - "name": "Google: Gemini 2.5 Flash Lite", - "display_name": "Google: Gemini 2.5 Flash Lite", - "modalities": { - "input": [ - "text", - "image", - "audio", - "video" - ], - "output": [ - "text" - ] - }, + "id": "doubao-1-5-thinking-vision-pro-250428", + "name": "doubao-1-5-thinking-vision-pro-250428", + "display_name": "doubao-1-5-thinking-vision-pro-250428", "limit": { - "context": 1048576, - "output": 65535 + "context": 8192, + "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "type": "imageGeneration" + "cost": { + "input": 2, + "output": 2, + "cache_read": 2 + }, + "type": "chat" }, { - "id": "google/gemini-2.5-flash-lite-preview-09-2025", - "name": "Google: Gemini 2.5 Flash Lite Preview 09-2025", - "display_name": "Google: Gemini 2.5 Flash Lite Preview 09-2025", - "modalities": { - "input": [ - "text", - "image", - "audio", - "video" - ], - "output": [ - "text" - ] - }, + "id": "aistudio_gemini-2.0-flash", + "name": "aistudio_gemini-2.0-flash", + "display_name": "aistudio_gemini-2.0-flash", "limit": { - "context": 1048576, - "output": 65536 + "context": 8192, + "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "type": "imageGeneration" + "cost": { + "input": 0.1, + "output": 0.4, + "cache_read": 0.25 + }, + "type": "chat" }, { - "id": "google/gemini-2.5-flash-preview-09-2025", - "name": "Google: Gemini 2.5 Flash Preview 09-2025", - "display_name": "Google: Gemini 2.5 Flash Preview 09-2025", - "modalities": { - "input": [ - "image", - "text", - "audio", - "video" - ], - "output": [ - "text" - ] - }, + "id": "aistudio_gpt-4.1-mini", + "name": "aistudio_gpt-4.1-mini", + "display_name": "aistudio_gpt-4.1-mini", "limit": { - "context": 1048576, - "output": 65536 + "context": 8192, + "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "type": "imageGeneration" + "cost": { + "input": 0.4, + "output": 1.6, + "cache_read": 0.1 + }, + "type": "chat" }, { - "id": "google/gemini-2.5-pro", - "name": "Google: Gemini 2.5 Pro", - "display_name": "Google: Gemini 2.5 Pro", - "modalities": { - "input": [ - "text", - "image", - "audio", - "video" - ], - "output": [ - "text" - ] - }, + "id": "deepseek-r1-distill-qianfan-llama-8b", + "name": "deepseek-r1-distill-qianfan-llama-8b", + "display_name": "deepseek-r1-distill-qianfan-llama-8b", "limit": { - "context": 1048576, - "output": 65536 + "context": 8192, + "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "type": "imageGeneration" + "cost": { + "input": 0.137, + "output": 0.548 + }, + "type": "chat" }, { - "id": "google/gemini-2.5-pro-preview", - "name": "Google: Gemini 2.5 Pro Preview 06-05", - "display_name": "Google: Gemini 2.5 Pro Preview 06-05", - "modalities": { - "input": [ - "image", - "text", - "audio" - ], - "output": [ - "text" - ] - }, + "id": "doubao-1-5-pro-256k-250115", + "name": "doubao-1-5-pro-256k-250115", + "display_name": "doubao-1-5-pro-256k-250115", "limit": { - "context": 1048576, - "output": 65536 + "context": 8192, + "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "type": "imageGeneration" + "cost": { + "input": 0.684, + "output": 1.2312 + }, + "type": "chat" }, { - "id": "google/gemini-2.5-pro-preview-05-06", - "name": "Google: Gemini 2.5 Pro Preview 05-06", - "display_name": "Google: Gemini 2.5 Pro Preview 05-06", - "modalities": { - "input": [ - "text", - "image", - "audio", - "video" - ], - "output": [ - "text" - ] - }, + "id": "doubao-1-5-pro-32k-250115", + "name": "doubao-1-5-pro-32k-250115", + "display_name": "doubao-1-5-pro-32k-250115", "limit": { - "context": 1048576, - "output": 65535 + "context": 8192, + "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "type": "imageGeneration" + "cost": { + "input": 0.108, + "output": 0.27 + }, + "type": "chat" }, { - "id": "google/gemini-3-flash-preview", - "name": "Google: Gemini 3 Flash Preview", - "display_name": "Google: Gemini 3 Flash Preview", - "modalities": { - "input": [ - "text", - "image", - "audio", - "video" - ], - "output": [ - "text" - ] - }, + "id": "gpt-4o-2024-08-06-global", + "name": "gpt-4o-2024-08-06-global", + "display_name": "gpt-4o-2024-08-06-global", "limit": { - "context": 1048576, - "output": 65535 + "context": 8192, + "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "type": "imageGeneration" + "cost": { + "input": 2.5, + "output": 10, + "cache_read": 1.25 + }, + "type": "chat" }, { - "id": "google/gemini-3-pro-image-preview", - "name": "Google: Nano Banana Pro (Gemini 3 Pro Image Preview)", - "display_name": "Google: Nano Banana Pro (Gemini 3 Pro Image Preview)", - "modalities": { - "input": [ - "image", - "text" - ], - "output": [ - "image", - "text" - ] - }, + "id": "gpt-4o-mini-global", + "name": "gpt-4o-mini-global", + "display_name": "gpt-4o-mini-global", "limit": { - "context": 65536, - "output": 32768 + "context": 8192, + "output": 8192 }, "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false + }, + "cost": { + "input": 0.15, + "output": 0.6, + "cache_read": 0.075 }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "google/gemini-3-pro-preview", - "name": "Google: Gemini 3 Pro Preview", - "display_name": "Google: Gemini 3 Pro Preview", - "modalities": { - "input": [ - "text", - "image", - "audio", - "video" - ], - "output": [ - "text" - ] - }, + "id": "meta-llama-3-70b", + "name": "meta-llama-3-70b", + "display_name": "meta-llama-3-70b", "limit": { - "context": 1048576, - "output": 65536 + "context": 8192, + "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "type": "imageGeneration" + "cost": { + "input": 4.795, + "output": 4.795 + }, + "type": "chat" }, { - "id": "google/gemma-2-27b-it", - "name": "Google: Gemma 2 27B", - "display_name": "Google: Gemma 2 27B", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, + "id": "meta-llama-3-8b", + "name": "meta-llama-3-8b", + "display_name": "meta-llama-3-8b", "limit": { "context": 8192, "output": 8192 @@ -87717,20 +98741,16 @@ "reasoning": { "supported": false }, + "cost": { + "input": 0.548, + "output": 0.548 + }, "type": "chat" }, { - "id": "google/gemma-2-9b-it", - "name": "Google: Gemma 2 9B", - "display_name": "Google: Gemma 2 9B", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, + "id": "o3-global", + "name": "o3-global", + "display_name": "o3-global", "limit": { "context": 8192, "output": 8192 @@ -87739,150 +98759,141 @@ "reasoning": { "supported": false }, + "cost": { + "input": 2, + "output": 8, + "cache_read": 0.5 + }, "type": "chat" }, { - "id": "google/gemma-3-12b-it", - "name": "Google: Gemma 3 12B", - "display_name": "Google: Gemma 3 12B", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, + "id": "o3-mini-global", + "name": "o3-mini-global", + "display_name": "o3-mini-global", "limit": { - "context": 131072, - "output": 131072 + "context": 8192, + "output": 8192 }, "tool_call": false, "reasoning": { "supported": false }, - "type": "imageGeneration" + "cost": { + "input": 1.1, + "output": 4.4, + "cache_read": 0.55 + }, + "type": "chat" }, { - "id": "google/gemma-3-12b-it:free", - "name": "Google: Gemma 3 12B (free)", - "display_name": "Google: Gemma 3 12B (free)", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, + "id": "o3-pro-global", + "name": "o3-pro-global", + "display_name": "o3-pro-global", "limit": { - "context": 32768, + "context": 8192, "output": 8192 }, "tool_call": false, "reasoning": { "supported": false }, - "type": "imageGeneration" + "cost": { + "input": 20, + "output": 80 + }, + "type": "chat" }, { - "id": "google/gemma-3-27b-it", - "name": "Google: Gemma 3 27B", - "display_name": "Google: Gemma 3 27B", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, + "id": "qianfan-chinese-llama-2-13b", + "name": "qianfan-chinese-llama-2-13b", + "display_name": "qianfan-chinese-llama-2-13b", "limit": { - "context": 96000, - "output": 96000 + "context": 8192, + "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "type": "imageGeneration" + "cost": { + "input": 0.822, + "output": 0.822 + }, + "type": "chat" }, { - "id": "google/gemma-3-27b-it:free", - "name": "Google: Gemma 3 27B (free)", - "display_name": "Google: Gemma 3 27B (free)", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, + "id": "qianfan-llama-vl-8b", + "name": "qianfan-llama-vl-8b", + "display_name": "qianfan-llama-vl-8b", "limit": { - "context": 131072, - "output": 131072 + "context": 8192, + "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "type": "imageGeneration" - }, + "cost": { + "input": 0.274, + "output": 0.685 + }, + "type": "chat" + } + ] + }, + "openrouter": { + "id": "openrouter", + "name": "OpenRouter", + "display_name": "OpenRouter", + "models": [ { - "id": "google/gemma-3-4b-it", - "name": "Google: Gemma 3 4B", - "display_name": "Google: Gemma 3 4B", + "id": "ai21/jamba-large-1.7", + "name": "AI21: Jamba Large 1.7", + "display_name": "AI21: Jamba Large 1.7", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 96000, - "output": 96000 + "context": 256000, + "output": 4096 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "google/gemma-3-4b-it:free", - "name": "Google: Gemma 3 4B (free)", - "display_name": "Google: Gemma 3 4B (free)", + "id": "ai21/jamba-mini-1.7", + "name": "AI21: Jamba Mini 1.7", + "display_name": "AI21: Jamba Mini 1.7", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 8192 + "context": 256000, + "output": 4096 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "google/gemma-3n-e2b-it:free", - "name": "Google: Gemma 3n 2B (free)", - "display_name": "Google: Gemma 3n 2B (free)", + "id": "aion-labs/aion-1.0", + "name": "AionLabs: Aion-1.0", + "display_name": "AionLabs: Aion-1.0", "modalities": { "input": [ "text" @@ -87892,19 +98903,20 @@ ] }, "limit": { - "context": 8192, - "output": 2048 + "context": 131072, + "output": 32768 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "type": "chat" }, { - "id": "google/gemma-3n-e4b-it", - "name": "Google: Gemma 3n 4B", - "display_name": "Google: Gemma 3n 4B", + "id": "aion-labs/aion-1.0-mini", + "name": "AionLabs: Aion-1.0-Mini", + "display_name": "AionLabs: Aion-1.0-Mini", "modalities": { "input": [ "text" @@ -87914,19 +98926,20 @@ ] }, "limit": { - "context": 32768, + "context": 131072, "output": 32768 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "type": "chat" }, { - "id": "google/gemma-3n-e4b-it:free", - "name": "Google: Gemma 3n 4B (free)", - "display_name": "Google: Gemma 3n 4B (free)", + "id": "aion-labs/aion-rp-llama-3.1-8b", + "name": "AionLabs: Aion-RP 1.0 (8B)", + "display_name": "AionLabs: Aion-RP 1.0 (8B)", "modalities": { "input": [ "text" @@ -87936,8 +98949,8 @@ ] }, "limit": { - "context": 8192, - "output": 2048 + "context": 32768, + "output": 32768 }, "tool_call": false, "reasoning": { @@ -87946,9 +98959,9 @@ "type": "chat" }, { - "id": "gryphe/mythomax-l2-13b", - "name": "MythoMax 13B", - "display_name": "MythoMax 13B", + "id": "alfredpros/codellama-7b-instruct-solidity", + "name": "AlfredPros: CodeLLaMa 7B Instruct Solidity", + "display_name": "AlfredPros: CodeLLaMa 7B Instruct Solidity", "modalities": { "input": [ "text" @@ -87968,9 +98981,9 @@ "type": "chat" }, { - "id": "ibm-granite/granite-4.0-h-micro", - "name": "IBM: Granite 4.0 Micro", - "display_name": "IBM: Granite 4.0 Micro", + "id": "alibaba/tongyi-deepresearch-30b-a3b", + "name": "Tongyi DeepResearch 30B A3B", + "display_name": "Tongyi DeepResearch 30B A3B", "modalities": { "input": [ "text" @@ -87980,42 +98993,44 @@ ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 131072, + "output": 131072 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "type": "chat" }, { - "id": "inception/mercury", - "name": "Inception: Mercury", - "display_name": "Inception: Mercury", + "id": "allenai/molmo-2-8b", + "name": "AllenAI: Molmo2 8B", + "display_name": "AllenAI: Molmo2 8B", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 36864, + "output": 36864 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "inception/mercury-coder", - "name": "Inception: Mercury Coder", - "display_name": "Inception: Mercury Coder", + "id": "allenai/olmo-2-0325-32b-instruct", + "name": "AllenAI: Olmo 2 32B Instruct", + "display_name": "AllenAI: Olmo 2 32B Instruct", "modalities": { "input": [ "text" @@ -88026,19 +99041,18 @@ }, "limit": { "context": 128000, - "output": 16384 + "output": 128000 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "type": "chat" }, { - "id": "inflection/inflection-3-pi", - "name": "Inflection: Inflection 3 Pi", - "display_name": "Inflection: Inflection 3 Pi", + "id": "allenai/olmo-3-32b-think", + "name": "AllenAI: Olmo 3 32B Think", + "display_name": "AllenAI: Olmo 3 32B Think", "modalities": { "input": [ "text" @@ -88048,19 +99062,21 @@ ] }, "limit": { - "context": 8000, - "output": 1024 + "context": 65536, + "output": 65536 }, + "temperature": true, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "type": "chat" }, { - "id": "inflection/inflection-3-productivity", - "name": "Inflection: Inflection 3 Productivity", - "display_name": "Inflection: Inflection 3 Productivity", + "id": "allenai/olmo-3-7b-instruct", + "name": "AllenAI: Olmo 3 7B Instruct", + "display_name": "AllenAI: Olmo 3 7B Instruct", "modalities": { "input": [ "text" @@ -88070,9 +99086,10 @@ ] }, "limit": { - "context": 8000, - "output": 1024 + "context": 65536, + "output": 65536 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false @@ -88080,9 +99097,9 @@ "type": "chat" }, { - "id": "kwaipilot/kat-coder-pro", - "name": "Kwaipilot: KAT-Coder-Pro V1", - "display_name": "Kwaipilot: KAT-Coder-Pro V1", + "id": "allenai/olmo-3-7b-think", + "name": "AllenAI: Olmo 3 7B Think", + "display_name": "AllenAI: Olmo 3 7B Think", "modalities": { "input": [ "text" @@ -88092,19 +99109,21 @@ ] }, "limit": { - "context": 256000, - "output": 128000 + "context": 65536, + "output": 65536 }, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "type": "chat" }, { - "id": "kwaipilot/kat-coder-pro:free", - "name": "Kwaipilot: KAT-Coder-Pro V1 (free)", - "display_name": "Kwaipilot: KAT-Coder-Pro V1 (free)", + "id": "allenai/olmo-3.1-32b-instruct", + "name": "AllenAI: Olmo 3.1 32B Instruct", + "display_name": "AllenAI: Olmo 3.1 32B Instruct", "modalities": { "input": [ "text" @@ -88114,9 +99133,10 @@ ] }, "limit": { - "context": 256000, - "output": 128000 + "context": 65536, + "output": 65536 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false @@ -88124,9 +99144,9 @@ "type": "chat" }, { - "id": "liquid/lfm-2.2-6b", - "name": "LiquidAI/LFM2-2.6B", - "display_name": "LiquidAI/LFM2-2.6B", + "id": "allenai/olmo-3.1-32b-think", + "name": "AllenAI: Olmo 3.1 32B Think", + "display_name": "AllenAI: Olmo 3.1 32B Think", "modalities": { "input": [ "text" @@ -88136,19 +99156,21 @@ ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 65536, + "output": 65536 }, + "temperature": true, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "type": "chat" }, { - "id": "liquid/lfm2-8b-a1b", - "name": "LiquidAI/LFM2-8B-A1B", - "display_name": "LiquidAI/LFM2-8B-A1B", + "id": "alpindale/goliath-120b", + "name": "Goliath 120B", + "display_name": "Goliath 120B", "modalities": { "input": [ "text" @@ -88158,8 +99180,8 @@ ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 6144, + "output": 1024 }, "tool_call": false, "reasoning": { @@ -88168,53 +99190,58 @@ "type": "chat" }, { - "id": "mancer/weaver", - "name": "Mancer: Weaver (alpha)", - "display_name": "Mancer: Weaver (alpha)", + "id": "amazon/nova-2-lite-v1", + "name": "Amazon: Nova 2 Lite", + "display_name": "Amazon: Nova 2 Lite", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 8000, - "output": 2000 + "context": 1000000, + "output": 65535 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" + "attachment": true, + "type": "imageGeneration" }, { - "id": "meituan/longcat-flash-chat", - "name": "Meituan: LongCat Flash Chat", - "display_name": "Meituan: LongCat Flash Chat", + "id": "amazon/nova-lite-v1", + "name": "Amazon: Nova Lite 1.0", + "display_name": "Amazon: Nova Lite 1.0", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 300000, + "output": 5120 }, "tool_call": false, "reasoning": { "supported": false }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "meta-llama/llama-3-70b-instruct", - "name": "Meta: Llama 3 70B Instruct", - "display_name": "Meta: Llama 3 70B Instruct", + "id": "amazon/nova-micro-v1", + "name": "Amazon: Nova Micro 1.0", + "display_name": "Amazon: Nova Micro 1.0", "modalities": { "input": [ "text" @@ -88224,63 +99251,65 @@ ] }, "limit": { - "context": 8192, - "output": 16384 + "context": 128000, + "output": 5120 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "type": "chat" }, { - "id": "meta-llama/llama-3-8b-instruct", - "name": "Meta: Llama 3 8B Instruct", - "display_name": "Meta: Llama 3 8B Instruct", + "id": "amazon/nova-premier-v1", + "name": "Amazon: Nova Premier 1.0", + "display_name": "Amazon: Nova Premier 1.0", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 16384 + "context": 1000000, + "output": 32000 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "meta-llama/llama-3.1-405b", - "name": "Meta: Llama 3.1 405B (base)", - "display_name": "Meta: Llama 3.1 405B (base)", + "id": "amazon/nova-pro-v1", + "name": "Amazon: Nova Pro 1.0", + "display_name": "Amazon: Nova Pro 1.0", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 300000, + "output": 5120 }, "tool_call": false, "reasoning": { "supported": false }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "meta-llama/llama-3.1-405b-instruct", - "name": "Meta: Llama 3.1 405B Instruct", - "display_name": "Meta: Llama 3.1 405B Instruct", + "id": "anthracite-org/magnum-v4-72b", + "name": "Magnum v4 72B", + "display_name": "Magnum v4 72B", "modalities": { "input": [ "text" @@ -88290,85 +99319,89 @@ ] }, "limit": { - "context": 10000, - "output": 10000 + "context": 16384, + "output": 2048 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "type": "chat" }, { - "id": "meta-llama/llama-3.1-405b-instruct:free", - "name": "Meta: Llama 3.1 405B Instruct (free)", - "display_name": "Meta: Llama 3.1 405B Instruct (free)", + "id": "anthropic/claude-3-haiku", + "name": "Anthropic: Claude 3 Haiku", + "display_name": "Anthropic: Claude 3 Haiku", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 200000, + "output": 4096 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "meta-llama/llama-3.1-70b-instruct", - "name": "Meta: Llama 3.1 70B Instruct", - "display_name": "Meta: Llama 3.1 70B Instruct", + "id": "anthropic/claude-3.5-haiku", + "name": "Anthropic: Claude 3.5 Haiku", + "display_name": "Anthropic: Claude 3.5 Haiku", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 200000, + "output": 8192 }, "tool_call": true, "reasoning": { "supported": false }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "meta-llama/llama-3.1-8b-instruct", - "name": "Meta: Llama 3.1 8B Instruct", - "display_name": "Meta: Llama 3.1 8B Instruct", + "id": "anthropic/claude-3.5-sonnet", + "name": "Anthropic: Claude 3.5 Sonnet", + "display_name": "Anthropic: Claude 3.5 Sonnet", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 200000, + "output": 8192 }, "tool_call": true, "reasoning": { "supported": false }, - "type": "chat" + "attachment": true, + "type": "imageGeneration" }, - { - "id": "meta-llama/llama-3.2-11b-vision-instruct", - "name": "Meta: Llama 3.2 11B Vision Instruct", - "display_name": "Meta: Llama 3.2 11B Vision Instruct", + { + "id": "anthropic/claude-3.7-sonnet", + "name": "Anthropic: Claude 3.7 Sonnet", + "display_name": "Anthropic: Claude 3.7 Sonnet", "modalities": { "input": [ "text", @@ -88379,43 +99412,49 @@ ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 200000, + "output": 64000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, + "attachment": true, "type": "imageGeneration" }, { - "id": "meta-llama/llama-3.2-1b-instruct", - "name": "Meta: Llama 3.2 1B Instruct", - "display_name": "Meta: Llama 3.2 1B Instruct", + "id": "anthropic/claude-3.7-sonnet:thinking", + "name": "Anthropic: Claude 3.7 Sonnet (thinking)", + "display_name": "Anthropic: Claude 3.7 Sonnet (thinking)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 60000, - "output": 60000 + "context": 200000, + "output": 64000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" + "attachment": true, + "type": "imageGeneration" }, { - "id": "meta-llama/llama-3.2-3b-instruct", - "name": "Meta: Llama 3.2 3B Instruct", - "display_name": "Meta: Llama 3.2 3B Instruct", + "id": "anthropic/claude-haiku-4.5", + "name": "Anthropic: Claude Haiku 4.5", + "display_name": "Anthropic: Claude Haiku 4.5", "modalities": { "input": [ + "image", "text" ], "output": [ @@ -88423,21 +99462,23 @@ ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 200000, + "output": 64000 }, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "meta-llama/llama-3.2-3b-instruct:free", - "name": "Meta: Llama 3.2 3B Instruct (free)", - "display_name": "Meta: Llama 3.2 3B Instruct (free)", + "id": "anthropic/claude-opus-4", + "name": "Anthropic: Claude Opus 4", + "display_name": "Anthropic: Claude Opus 4", "modalities": { "input": [ + "image", "text" ], "output": [ @@ -88445,44 +99486,49 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 200000, + "output": 32000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" + "attachment": true, + "type": "imageGeneration" }, { - "id": "meta-llama/llama-3.2-90b-vision-instruct", - "name": "Meta: Llama 3.2 90B Vision Instruct", - "display_name": "Meta: Llama 3.2 90B Vision Instruct", + "id": "anthropic/claude-opus-4.1", + "name": "Anthropic: Claude Opus 4.1", + "display_name": "Anthropic: Claude Opus 4.1", "modalities": { "input": [ - "text", - "image" + "image", + "text" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 200000, + "output": 32000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, + "attachment": true, "type": "imageGeneration" }, { - "id": "meta-llama/llama-3.3-70b-instruct", - "name": "Meta: Llama 3.3 70B Instruct", - "display_name": "Meta: Llama 3.3 70B Instruct", + "id": "anthropic/claude-opus-4.5", + "name": "Anthropic: Claude Opus 4.5", + "display_name": "Anthropic: Claude Opus 4.5", "modalities": { "input": [ + "image", "text" ], "output": [ @@ -88490,64 +99536,70 @@ ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 200000, + "output": 64000 }, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" + "attachment": true, + "type": "imageGeneration" }, { - "id": "meta-llama/llama-3.3-70b-instruct:free", - "name": "Meta: Llama 3.3 70B Instruct (free)", - "display_name": "Meta: Llama 3.3 70B Instruct (free)", + "id": "anthropic/claude-opus-4.6", + "name": "Anthropic: Claude Opus 4.6", + "display_name": "Anthropic: Claude Opus 4.6", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 1000000, + "output": 128000 }, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "meta-llama/llama-4-maverick", - "name": "Meta: Llama 4 Maverick", - "display_name": "Meta: Llama 4 Maverick", + "id": "anthropic/claude-sonnet-4", + "name": "Anthropic: Claude Sonnet 4", + "display_name": "Anthropic: Claude Sonnet 4", "modalities": { "input": [ - "text", - "image" + "image", + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 16384 + "context": 1000000, + "output": 64000 }, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, + "attachment": true, "type": "imageGeneration" }, { - "id": "meta-llama/llama-4-scout", - "name": "Meta: Llama 4 Scout", - "display_name": "Meta: Llama 4 Scout", + "id": "anthropic/claude-sonnet-4.5", + "name": "Anthropic: Claude Sonnet 4.5", + "display_name": "Anthropic: Claude Sonnet 4.5", "modalities": { "input": [ "text", @@ -88558,19 +99610,22 @@ ] }, "limit": { - "context": 327680, - "output": 16384 + "context": 1000000, + "output": 64000 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, + "attachment": true, "type": "imageGeneration" }, { - "id": "meta-llama/llama-guard-2-8b", - "name": "Meta: LlamaGuard 2 8B", - "display_name": "Meta: LlamaGuard 2 8B", + "id": "arcee-ai/coder-large", + "name": "Arcee AI: Coder Large", + "display_name": "Arcee AI: Coder Large", "modalities": { "input": [ "text" @@ -88580,8 +99635,8 @@ ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 32768, + "output": 32768 }, "tool_call": false, "reasoning": { @@ -88590,9 +99645,9 @@ "type": "chat" }, { - "id": "meta-llama/llama-guard-3-8b", - "name": "Llama Guard 3 8B", - "display_name": "Llama Guard 3 8B", + "id": "arcee-ai/maestro-reasoning", + "name": "Arcee AI: Maestro Reasoning", + "display_name": "Arcee AI: Maestro Reasoning", "modalities": { "input": [ "text" @@ -88603,7 +99658,7 @@ }, "limit": { "context": 131072, - "output": 131072 + "output": 32000 }, "tool_call": false, "reasoning": { @@ -88612,9 +99667,9 @@ "type": "chat" }, { - "id": "meta-llama/llama-guard-4-12b", - "name": "Meta: Llama Guard 4 12B", - "display_name": "Meta: Llama Guard 4 12B", + "id": "arcee-ai/spotlight", + "name": "Arcee AI: Spotlight", + "display_name": "Arcee AI: Spotlight", "modalities": { "input": [ "image", @@ -88625,8 +99680,8 @@ ] }, "limit": { - "context": 163840, - "output": 163840 + "context": 131072, + "output": 65537 }, "tool_call": false, "reasoning": { @@ -88635,9 +99690,9 @@ "type": "imageGeneration" }, { - "id": "microsoft/phi-4", - "name": "Microsoft: Phi 4", - "display_name": "Microsoft: Phi 4", + "id": "arcee-ai/trinity-large-preview:free", + "name": "Arcee AI: Trinity Large Preview (free)", + "display_name": "Arcee AI: Trinity Large Preview (free)", "modalities": { "input": [ "text" @@ -88647,9 +99702,10 @@ ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 131000, + "output": 131000 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false @@ -88657,13 +99713,12 @@ "type": "chat" }, { - "id": "microsoft/phi-4-multimodal-instruct", - "name": "Microsoft: Phi 4 Multimodal Instruct", - "display_name": "Microsoft: Phi 4 Multimodal Instruct", + "id": "arcee-ai/trinity-mini", + "name": "Arcee AI: Trinity Mini", + "display_name": "Arcee AI: Trinity Mini", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -88673,16 +99728,18 @@ "context": 131072, "output": 131072 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "microsoft/phi-4-reasoning-plus", - "name": "Microsoft: Phi 4 Reasoning Plus", - "display_name": "Microsoft: Phi 4 Reasoning Plus", + "id": "arcee-ai/trinity-mini:free", + "name": "Arcee AI: Trinity Mini (free)", + "display_name": "Arcee AI: Trinity Mini (free)", "modalities": { "input": [ "text" @@ -88692,10 +99749,11 @@ ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 131072, + "output": 131072 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true @@ -88703,9 +99761,9 @@ "type": "chat" }, { - "id": "microsoft/wizardlm-2-8x22b", - "name": "WizardLM-2 8x22B", - "display_name": "WizardLM-2 8x22B", + "id": "arcee-ai/virtuoso-large", + "name": "Arcee AI: Virtuoso Large", + "display_name": "Arcee AI: Virtuoso Large", "modalities": { "input": [ "text" @@ -88715,42 +99773,19 @@ ] }, "limit": { - "context": 65536, - "output": 16384 + "context": 131072, + "output": 64000 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "type": "chat" }, { - "id": "minimax/minimax-01", - "name": "MiniMax: MiniMax-01", - "display_name": "MiniMax: MiniMax-01", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 1000192, - "output": 1000192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "type": "imageGeneration" - }, - { - "id": "minimax/minimax-m1", - "name": "MiniMax: MiniMax M1", - "display_name": "MiniMax: MiniMax M1", + "id": "baidu/ernie-4.5-21b-a3b", + "name": "Baidu: ERNIE 4.5 21B A3B", + "display_name": "Baidu: ERNIE 4.5 21B A3B", "modalities": { "input": [ "text" @@ -88760,20 +99795,20 @@ ] }, "limit": { - "context": 1000000, - "output": 40000 + "context": 120000, + "output": 8000 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "type": "chat" }, { - "id": "minimax/minimax-m2", - "name": "MiniMax: MiniMax M2", - "display_name": "MiniMax: MiniMax M2", + "id": "baidu/ernie-4.5-21b-a3b-thinking", + "name": "Baidu: ERNIE 4.5 21B A3B Thinking", + "display_name": "Baidu: ERNIE 4.5 21B A3B Thinking", "modalities": { "input": [ "text" @@ -88783,11 +99818,11 @@ ] }, "limit": { - "context": 196608, + "context": 131072, "output": 65536 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true @@ -88795,9 +99830,9 @@ "type": "chat" }, { - "id": "minimax/minimax-m2.1", - "name": "MiniMax: MiniMax M2.1", - "display_name": "MiniMax: MiniMax M2.1", + "id": "baidu/ernie-4.5-300b-a47b", + "name": "Baidu: ERNIE 4.5 300B A47B", + "display_name": "Baidu: ERNIE 4.5 300B A47B", "modalities": { "input": [ "text" @@ -88807,46 +99842,46 @@ ] }, "limit": { - "context": 196608, - "output": 196608 + "context": 123000, + "output": 12000 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "type": "chat" }, { - "id": "mistralai/codestral-2508", - "name": "Mistral: Codestral 2508", - "display_name": "Mistral: Codestral 2508", + "id": "baidu/ernie-4.5-vl-28b-a3b", + "name": "Baidu: ERNIE 4.5 VL 28B A3B", + "display_name": "Baidu: ERNIE 4.5 VL 28B A3B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 30000, + "output": 8000 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "mistralai/devstral-2512", - "name": "Mistral: Devstral 2 2512", - "display_name": "Mistral: Devstral 2 2512", + "id": "baidu/ernie-4.5-vl-424b-a47b", + "name": "Baidu: ERNIE 4.5 VL 424B A47B", + "display_name": "Baidu: ERNIE 4.5 VL 424B A47B", "modalities": { "input": [ + "image", "text" ], "output": [ @@ -88854,23 +99889,25 @@ ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 123000, + "output": 16000 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "mistralai/devstral-2512:free", - "name": "Mistral: Devstral 2 2512 (free)", - "display_name": "Mistral: Devstral 2 2512 (free)", + "id": "bytedance-seed/seed-1.6", + "name": "ByteDance Seed: Seed 1.6", + "display_name": "ByteDance Seed: Seed 1.6", "modalities": { "input": [ - "text" + "image", + "text", + "video" ], "output": [ "text" @@ -88878,44 +99915,47 @@ }, "limit": { "context": 262144, - "output": 262144 + "output": 32768 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "mistralai/devstral-medium", - "name": "Mistral: Devstral Medium", - "display_name": "Mistral: Devstral Medium", + "id": "bytedance-seed/seed-1.6-flash", + "name": "ByteDance Seed: Seed 1.6 Flash", + "display_name": "ByteDance Seed: Seed 1.6 Flash", "modalities": { "input": [ - "text" + "image", + "text", + "video" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 262144, + "output": 32768 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "mistralai/devstral-small", - "name": "Mistral: Devstral Small 1.1", - "display_name": "Mistral: Devstral Small 1.1", + "id": "bytedance/ui-tars-1.5-7b", + "name": "ByteDance: UI-TARS 7B", + "display_name": "ByteDance: UI-TARS 7B", "modalities": { "input": [ + "image", "text" ], "output": [ @@ -88924,19 +99964,18 @@ }, "limit": { "context": 128000, - "output": 128000 + "output": 2048 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "mistralai/devstral-small-2505", - "name": "Mistral: Devstral Small 2505", - "display_name": "Mistral: Devstral Small 2505", + "id": "cognitivecomputations/dolphin-mistral-24b-venice-edition:free", + "name": "Venice: Uncensored (free)", + "display_name": "Venice: Uncensored (free)", "modalities": { "input": [ "text" @@ -88946,10 +99985,9 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 32768, + "output": 32768 }, - "temperature": true, "tool_call": false, "reasoning": { "supported": false @@ -88957,33 +99995,31 @@ "type": "chat" }, { - "id": "mistralai/ministral-14b-2512", - "name": "Mistral: Ministral 3 14B 2512", - "display_name": "Mistral: Ministral 3 14B 2512", + "id": "cohere/command-a", + "name": "Cohere: Command A", + "display_name": "Cohere: Command A", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 256000, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "mistralai/ministral-3b", - "name": "Mistral: Ministral 3B", - "display_name": "Mistral: Ministral 3B", + "id": "cohere/command-r-08-2024", + "name": "Cohere: Command R (08-2024)", + "display_name": "Cohere: Command R (08-2024)", "modalities": { "input": [ "text" @@ -88993,10 +100029,9 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 128000, + "output": 4000 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": false @@ -89004,33 +100039,31 @@ "type": "chat" }, { - "id": "mistralai/ministral-3b-2512", - "name": "Mistral: Ministral 3 3B 2512", - "display_name": "Mistral: Ministral 3 3B 2512", + "id": "cohere/command-r-plus-08-2024", + "name": "Cohere: Command R+ (08-2024)", + "display_name": "Cohere: Command R+ (08-2024)", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 128000, + "output": 4000 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "mistralai/ministral-8b", - "name": "Mistral: Ministral 8B", - "display_name": "Mistral: Ministral 8B", + "id": "cohere/command-r7b-12-2024", + "name": "Cohere: Command R7B (12-2024)", + "display_name": "Cohere: Command R7B (12-2024)", "modalities": { "input": [ "text" @@ -89040,44 +100073,42 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 128000, + "output": 4000 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "type": "chat" }, { - "id": "mistralai/ministral-8b-2512", - "name": "Mistral: Ministral 3 8B 2512", - "display_name": "Mistral: Ministral 3 8B 2512", + "id": "deepcogito/cogito-v2.1-671b", + "name": "Deep Cogito: Cogito v2.1 671B", + "display_name": "Deep Cogito: Cogito v2.1 671B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 128000, + "output": 128000 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "mistralai/mistral-7b-instruct", - "name": "Mistral: Mistral 7B Instruct", - "display_name": "Mistral: Mistral 7B Instruct", + "id": "deepseek/deepseek-chat", + "name": "DeepSeek: DeepSeek V3", + "display_name": "DeepSeek: DeepSeek V3", "modalities": { "input": [ "text" @@ -89087,10 +100118,9 @@ ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 163840, + "output": 163840 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": false @@ -89098,9 +100128,9 @@ "type": "chat" }, { - "id": "mistralai/mistral-7b-instruct-v0.1", - "name": "Mistral: Mistral 7B Instruct v0.1", - "display_name": "Mistral: Mistral 7B Instruct v0.1", + "id": "deepseek/deepseek-chat-v3-0324", + "name": "DeepSeek: DeepSeek V3 0324", + "display_name": "DeepSeek: DeepSeek V3 0324", "modalities": { "input": [ "text" @@ -89110,20 +100140,20 @@ ] }, "limit": { - "context": 2824, - "output": 2824 + "context": 163840, + "output": 65536 }, - "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "type": "chat" }, { - "id": "mistralai/mistral-7b-instruct-v0.2", - "name": "Mistral: Mistral 7B Instruct v0.2", - "display_name": "Mistral: Mistral 7B Instruct v0.2", + "id": "deepseek/deepseek-chat-v3.1", + "name": "DeepSeek: DeepSeek V3.1", + "display_name": "DeepSeek: DeepSeek V3.1", "modalities": { "input": [ "text" @@ -89134,19 +100164,19 @@ }, "limit": { "context": 32768, - "output": 32768 + "output": 7168 }, - "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "type": "chat" }, { - "id": "mistralai/mistral-7b-instruct-v0.3", - "name": "Mistral: Mistral 7B Instruct v0.3", - "display_name": "Mistral: Mistral 7B Instruct v0.3", + "id": "deepseek/deepseek-r1", + "name": "DeepSeek: R1", + "display_name": "DeepSeek: R1", "modalities": { "input": [ "text" @@ -89156,20 +100186,20 @@ ] }, "limit": { - "context": 32768, - "output": 4096 + "context": 64000, + "output": 16000 }, - "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "type": "chat" }, { - "id": "mistralai/mistral-7b-instruct:free", - "name": "Mistral: Mistral 7B Instruct (free)", - "display_name": "Mistral: Mistral 7B Instruct (free)", + "id": "deepseek/deepseek-r1-0528", + "name": "DeepSeek: R1 0528", + "display_name": "DeepSeek: R1 0528", "modalities": { "input": [ "text" @@ -89179,20 +100209,20 @@ ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 163840, + "output": 65536 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "type": "chat" }, { - "id": "mistralai/mistral-large", - "name": "Mistral Large", - "display_name": "Mistral Large", + "id": "deepseek/deepseek-r1-0528:free", + "name": "DeepSeek: R1 0528 (free)", + "display_name": "DeepSeek: R1 0528 (free)", "modalities": { "input": [ "text" @@ -89202,20 +100232,20 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 163840, + "output": 163840 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "type": "chat" }, { - "id": "mistralai/mistral-large-2407", - "name": "Mistral Large 2407", - "display_name": "Mistral Large 2407", + "id": "deepseek/deepseek-r1-distill-llama-70b", + "name": "DeepSeek: R1 Distill Llama 70B", + "display_name": "DeepSeek: R1 Distill Llama 70B", "modalities": { "input": [ "text" @@ -89228,17 +100258,17 @@ "context": 131072, "output": 131072 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "type": "chat" }, { - "id": "mistralai/mistral-large-2411", - "name": "Mistral Large 2411", - "display_name": "Mistral Large 2411", + "id": "deepseek/deepseek-r1-distill-qwen-32b", + "name": "DeepSeek: R1 Distill Qwen 32B", + "display_name": "DeepSeek: R1 Distill Qwen 32B", "modalities": { "input": [ "text" @@ -89248,92 +100278,90 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 32768, + "output": 32768 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "type": "chat" }, { - "id": "mistralai/mistral-large-2512", - "name": "Mistral: Mistral Large 3 2512", - "display_name": "Mistral: Mistral Large 3 2512", + "id": "deepseek/deepseek-v3.1-terminus", + "name": "DeepSeek: DeepSeek V3.1 Terminus", + "display_name": "DeepSeek: DeepSeek V3.1 Terminus", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 163840, + "output": 163840 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "mistralai/mistral-medium-3", - "name": "Mistral: Mistral Medium 3", - "display_name": "Mistral: Mistral Medium 3", + "id": "deepseek/deepseek-v3.1-terminus:exacto", + "name": "DeepSeek: DeepSeek V3.1 Terminus (exacto)", + "display_name": "DeepSeek: DeepSeek V3.1 Terminus (exacto)", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 163840, + "output": 163840 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "mistralai/mistral-medium-3.1", - "name": "Mistral: Mistral Medium 3.1", - "display_name": "Mistral: Mistral Medium 3.1", + "id": "deepseek/deepseek-v3.2", + "name": "DeepSeek: DeepSeek V3.2", + "display_name": "DeepSeek: DeepSeek V3.2", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 163840, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "mistralai/mistral-nemo", - "name": "Mistral: Mistral Nemo", - "display_name": "Mistral: Mistral Nemo", + "id": "deepseek/deepseek-v3.2-exp", + "name": "DeepSeek: DeepSeek V3.2 Exp", + "display_name": "DeepSeek: DeepSeek V3.2 Exp", "modalities": { "input": [ "text" @@ -89343,20 +100371,21 @@ ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 163840, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "type": "chat" }, { - "id": "mistralai/mistral-saba", - "name": "Mistral: Saba", - "display_name": "Mistral: Saba", + "id": "deepseek/deepseek-v3.2-speciale", + "name": "DeepSeek: DeepSeek V3.2 Speciale", + "display_name": "DeepSeek: DeepSeek V3.2 Speciale", "modalities": { "input": [ "text" @@ -89366,20 +100395,21 @@ ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 163840, + "output": 65536 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "type": "chat" }, { - "id": "mistralai/mistral-small-24b-instruct-2501", - "name": "Mistral: Mistral Small 3", - "display_name": "Mistral: Mistral Small 3", + "id": "eleutherai/llemma_7b", + "name": "EleutherAI: Llemma 7b", + "display_name": "EleutherAI: Llemma 7b", "modalities": { "input": [ "text" @@ -89389,120 +100419,127 @@ ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 4096, + "output": 4096 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "type": "chat" }, { - "id": "mistralai/mistral-small-3.1-24b-instruct", - "name": "Mistral: Mistral Small 3.1 24B", - "display_name": "Mistral: Mistral Small 3.1 24B", + "id": "essentialai/rnj-1-instruct", + "name": "EssentialAI: Rnj 1 Instruct", + "display_name": "EssentialAI: Rnj 1 Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 32768, + "output": 32768 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "mistralai/mistral-small-3.1-24b-instruct:free", - "name": "Mistral: Mistral Small 3.1 24B (free)", - "display_name": "Mistral: Mistral Small 3.1 24B (free)", + "id": "google/gemini-2.0-flash-001", + "name": "Google: Gemini 2.0 Flash", + "display_name": "Google: Gemini 2.0 Flash", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 1048576, + "output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": false }, + "attachment": true, "type": "imageGeneration" }, { - "id": "mistralai/mistral-small-3.2-24b-instruct", - "name": "Mistral: Mistral Small 3.2 24B", - "display_name": "Mistral: Mistral Small 3.2 24B", + "id": "google/gemini-2.0-flash-lite-001", + "name": "Google: Gemini 2.0 Flash Lite", + "display_name": "Google: Gemini 2.0 Flash Lite", "modalities": { "input": [ + "text", "image", - "text" + "audio", + "video" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 1048576, + "output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": false }, + "attachment": true, "type": "imageGeneration" }, { - "id": "mistralai/mistral-small-creative", - "name": "Mistral: Mistral Small Creative", - "display_name": "Mistral: Mistral Small Creative", + "id": "google/gemini-2.5-flash", + "name": "Google: Gemini 2.5 Flash", + "display_name": "Google: Gemini 2.5 Flash", "modalities": { "input": [ - "text" + "image", + "text", + "audio", + "video" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 1048576, + "output": 65535 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" + "attachment": true, + "type": "imageGeneration" }, { - "id": "mistralai/mistral-tiny", - "name": "Mistral Tiny", - "display_name": "Mistral Tiny", + "id": "google/gemini-2.5-flash-image", + "name": "Google: Gemini 2.5 Flash Image (Nano Banana)", + "display_name": "Google: Gemini 2.5 Flash Image (Nano Banana)", "modalities": { "input": [ + "image", "text" ], "output": [ + "image", "text" ] }, @@ -89510,113 +100547,127 @@ "context": 32768, "output": 32768 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "mistralai/mixtral-8x22b-instruct", - "name": "Mistral: Mixtral 8x22B Instruct", - "display_name": "Mistral: Mixtral 8x22B Instruct", + "id": "google/gemini-2.5-flash-lite", + "name": "Google: Gemini 2.5 Flash Lite", + "display_name": "Google: Gemini 2.5 Flash Lite", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video" ], "output": [ "text" ] }, "limit": { - "context": 65536, - "output": 65536 + "context": 1048576, + "output": 65535 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" + "attachment": true, + "type": "imageGeneration" }, { - "id": "mistralai/mixtral-8x7b-instruct", - "name": "Mistral: Mixtral 8x7B Instruct", - "display_name": "Mistral: Mixtral 8x7B Instruct", + "id": "google/gemini-2.5-flash-lite-preview-09-2025", + "name": "Google: Gemini 2.5 Flash Lite Preview 09-2025", + "display_name": "Google: Gemini 2.5 Flash Lite Preview 09-2025", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 1048576, + "output": 65535 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" + "attachment": true, + "type": "imageGeneration" }, { - "id": "mistralai/pixtral-12b", - "name": "Mistral: Pixtral 12B", - "display_name": "Mistral: Pixtral 12B", + "id": "google/gemini-2.5-flash-preview-09-2025", + "name": "Google: Gemini 2.5 Flash Preview 09-2025", + "display_name": "Google: Gemini 2.5 Flash Preview 09-2025", "modalities": { "input": [ + "image", "text", - "image" + "audio", + "video" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 1048576, + "output": 65536 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, + "attachment": true, "type": "imageGeneration" }, { - "id": "mistralai/pixtral-large-2411", - "name": "Mistral: Pixtral Large 2411", - "display_name": "Mistral: Pixtral Large 2411", + "id": "google/gemini-2.5-pro", + "name": "Google: Gemini 2.5 Pro", + "display_name": "Google: Gemini 2.5 Pro", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 1048576, + "output": 65536 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, + "attachment": true, "type": "imageGeneration" }, { - "id": "mistralai/voxtral-small-24b-2507", - "name": "Mistral: Voxtral Small 24B 2507", - "display_name": "Mistral: Voxtral Small 24B 2507", + "id": "google/gemini-2.5-pro-preview", + "name": "Google: Gemini 2.5 Pro Preview 06-05", + "display_name": "Google: Gemini 2.5 Pro Preview 06-05", "modalities": { "input": [ + "image", "text", "audio" ], @@ -89625,109 +100676,127 @@ ] }, "limit": { - "context": 32000, - "output": 32000 + "context": 1048576, + "output": 65536 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" + "attachment": true, + "type": "imageGeneration" }, { - "id": "moonshotai/kimi-dev-72b", - "name": "MoonshotAI: Kimi Dev 72B", - "display_name": "MoonshotAI: Kimi Dev 72B", + "id": "google/gemini-2.5-pro-preview-05-06", + "name": "Google: Gemini 2.5 Pro Preview 05-06", + "display_name": "Google: Gemini 2.5 Pro Preview 05-06", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 1048576, + "output": 65535 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "type": "chat" + "attachment": true, + "type": "imageGeneration" }, { - "id": "moonshotai/kimi-k2", - "name": "MoonshotAI: Kimi K2 0711", - "display_name": "MoonshotAI: Kimi K2 0711", + "id": "google/gemini-3-flash-preview", + "name": "Google: Gemini 3 Flash Preview", + "display_name": "Google: Gemini 3 Flash Preview", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 1048576, + "output": 65535 }, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" + "attachment": true, + "type": "imageGeneration" }, { - "id": "moonshotai/kimi-k2-0905", - "name": "MoonshotAI: Kimi K2 0905", - "display_name": "MoonshotAI: Kimi K2 0905", + "id": "google/gemini-3-pro-image-preview", + "name": "Google: Nano Banana Pro (Gemini 3 Pro Image Preview)", + "display_name": "Google: Nano Banana Pro (Gemini 3 Pro Image Preview)", "modalities": { "input": [ + "image", "text" ], "output": [ + "image", "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 65536, + "output": 32768 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "moonshotai/kimi-k2-0905:exacto", - "name": "MoonshotAI: Kimi K2 0905 (exacto)", - "display_name": "MoonshotAI: Kimi K2 0905 (exacto)", + "id": "google/gemini-3-pro-preview", + "name": "Google: Gemini 3 Pro Preview", + "display_name": "Google: Gemini 3 Pro Preview", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 1048576, + "output": 65536 }, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" + "attachment": true, + "type": "imageGeneration" }, { - "id": "moonshotai/kimi-k2-thinking", - "name": "MoonshotAI: Kimi K2 Thinking", - "display_name": "MoonshotAI: Kimi K2 Thinking", + "id": "google/gemma-2-27b-it", + "name": "Google: Gemma 2 27B", + "display_name": "Google: Gemma 2 27B", "modalities": { "input": [ "text" @@ -89737,20 +100806,19 @@ ] }, "limit": { - "context": 262144, - "output": 65535 + "context": 8192, + "output": 2048 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "type": "chat" }, { - "id": "moonshotai/kimi-k2:free", - "name": "MoonshotAI: Kimi K2 0711 (free)", - "display_name": "MoonshotAI: Kimi K2 0711 (free)", + "id": "google/gemma-2-9b-it", + "name": "Google: Gemma 2 9B", + "display_name": "Google: Gemma 2 9B", "modalities": { "input": [ "text" @@ -89760,8 +100828,8 @@ ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 8192, + "output": 8192 }, "tool_call": false, "reasoning": { @@ -89770,122 +100838,128 @@ "type": "chat" }, { - "id": "morph/morph-v3-fast", - "name": "Morph: Morph V3 Fast", - "display_name": "Morph: Morph V3 Fast", + "id": "google/gemma-3-12b-it", + "name": "Google: Gemma 3 12B", + "display_name": "Google: Gemma 3 12B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 81920, - "output": 38000 + "context": 131072, + "output": 131072 }, "tool_call": false, "reasoning": { "supported": false }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "morph/morph-v3-large", - "name": "Morph: Morph V3 Large", - "display_name": "Morph: Morph V3 Large", + "id": "google/gemma-3-12b-it:free", + "name": "Google: Gemma 3 12B (free)", + "display_name": "Google: Gemma 3 12B (free)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 131072 + "context": 32768, + "output": 8192 }, "tool_call": false, "reasoning": { "supported": false }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "neversleep/llama-3.1-lumimaid-8b", - "name": "NeverSleep: Lumimaid v0.2 8B", - "display_name": "NeverSleep: Lumimaid v0.2 8B", + "id": "google/gemma-3-27b-it", + "name": "Google: Gemma 3 27B", + "display_name": "Google: Gemma 3 27B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 128000, + "output": 65536 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "neversleep/noromaid-20b", - "name": "Noromaid 20B", - "display_name": "Noromaid 20B", + "id": "google/gemma-3-27b-it:free", + "name": "Google: Gemma 3 27B (free)", + "display_name": "Google: Gemma 3 27B (free)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 4096, - "output": 4096 + "context": 131072, + "output": 8192 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "nex-agi/deepseek-v3.1-nex-n1:free", - "name": "Nex AGI: DeepSeek V3.1 Nex N1 (free)", - "display_name": "Nex AGI: DeepSeek V3.1 Nex N1 (free)", + "id": "google/gemma-3-4b-it", + "name": "Google: Gemma 3 4B", + "display_name": "Google: Gemma 3 4B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 163840 + "context": 96000, + "output": 96000 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "nousresearch/deephermes-3-mistral-24b-preview", - "name": "Nous: DeepHermes 3 Mistral 24B Preview", - "display_name": "Nous: DeepHermes 3 Mistral 24B Preview", + "id": "google/gemma-3-4b-it:free", + "name": "Google: Gemma 3 4B (free)", + "display_name": "Google: Gemma 3 4B (free)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -89893,19 +100967,18 @@ }, "limit": { "context": 32768, - "output": 32768 + "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "nousresearch/hermes-2-pro-llama-3-8b", - "name": "NousResearch: Hermes 2 Pro - Llama-3 8B", - "display_name": "NousResearch: Hermes 2 Pro - Llama-3 8B", + "id": "google/gemma-3n-e2b-it:free", + "name": "Google: Gemma 3n 2B (free)", + "display_name": "Google: Gemma 3n 2B (free)", "modalities": { "input": [ "text" @@ -89925,9 +100998,9 @@ "type": "chat" }, { - "id": "nousresearch/hermes-3-llama-3.1-405b", - "name": "Nous: Hermes 3 405B Instruct", - "display_name": "Nous: Hermes 3 405B Instruct", + "id": "google/gemma-3n-e4b-it", + "name": "Google: Gemma 3n 4B", + "display_name": "Google: Gemma 3n 4B", "modalities": { "input": [ "text" @@ -89937,8 +101010,8 @@ ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 32768, + "output": 32768 }, "tool_call": false, "reasoning": { @@ -89947,9 +101020,9 @@ "type": "chat" }, { - "id": "nousresearch/hermes-3-llama-3.1-405b:free", - "name": "Nous: Hermes 3 405B Instruct (free)", - "display_name": "Nous: Hermes 3 405B Instruct (free)", + "id": "google/gemma-3n-e4b-it:free", + "name": "Google: Gemma 3n 4B (free)", + "display_name": "Google: Gemma 3n 4B (free)", "modalities": { "input": [ "text" @@ -89959,8 +101032,8 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 8192, + "output": 2048 }, "tool_call": false, "reasoning": { @@ -89969,9 +101042,9 @@ "type": "chat" }, { - "id": "nousresearch/hermes-3-llama-3.1-70b", - "name": "Nous: Hermes 3 70B Instruct", - "display_name": "Nous: Hermes 3 70B Instruct", + "id": "gryphe/mythomax-l2-13b", + "name": "MythoMax 13B", + "display_name": "MythoMax 13B", "modalities": { "input": [ "text" @@ -89981,8 +101054,8 @@ ] }, "limit": { - "context": 65536, - "output": 65536 + "context": 4096, + "output": 4096 }, "tool_call": false, "reasoning": { @@ -89991,9 +101064,9 @@ "type": "chat" }, { - "id": "nousresearch/hermes-4-405b", - "name": "Nous: Hermes 4 405B", - "display_name": "Nous: Hermes 4 405B", + "id": "ibm-granite/granite-4.0-h-micro", + "name": "IBM: Granite 4.0 Micro", + "display_name": "IBM: Granite 4.0 Micro", "modalities": { "input": [ "text" @@ -90003,20 +101076,19 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 131000, + "output": 131000 }, "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "type": "chat" }, { - "id": "nousresearch/hermes-4-70b", - "name": "Nous: Hermes 4 70B", - "display_name": "Nous: Hermes 4 70B", + "id": "inception/mercury", + "name": "Inception: Mercury", + "display_name": "Inception: Mercury", "modalities": { "input": [ "text" @@ -90026,20 +101098,20 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 128000, + "output": 16384 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "type": "chat" }, { - "id": "nvidia/llama-3.1-nemotron-70b-instruct", - "name": "NVIDIA: Llama 3.1 Nemotron 70B Instruct", - "display_name": "NVIDIA: Llama 3.1 Nemotron 70B Instruct", + "id": "inception/mercury-coder", + "name": "Inception: Mercury Coder", + "display_name": "Inception: Mercury Coder", "modalities": { "input": [ "text" @@ -90049,9 +101121,10 @@ ] }, "limit": { - "context": 131072, + "context": 128000, "output": 16384 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false @@ -90059,9 +101132,9 @@ "type": "chat" }, { - "id": "nvidia/llama-3.1-nemotron-ultra-253b-v1", - "name": "NVIDIA: Llama 3.1 Nemotron Ultra 253B v1", - "display_name": "NVIDIA: Llama 3.1 Nemotron Ultra 253B v1", + "id": "inflection/inflection-3-pi", + "name": "Inflection: Inflection 3 Pi", + "display_name": "Inflection: Inflection 3 Pi", "modalities": { "input": [ "text" @@ -90071,20 +101144,19 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 8000, + "output": 1024 }, "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "type": "chat" }, { - "id": "nvidia/llama-3.3-nemotron-super-49b-v1.5", - "name": "NVIDIA: Llama 3.3 Nemotron Super 49B V1.5", - "display_name": "NVIDIA: Llama 3.3 Nemotron Super 49B V1.5", + "id": "inflection/inflection-3-productivity", + "name": "Inflection: Inflection 3 Productivity", + "display_name": "Inflection: Inflection 3 Productivity", "modalities": { "input": [ "text" @@ -90094,20 +101166,19 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 8000, + "output": 1024 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "type": "chat" }, { - "id": "nvidia/nemotron-3-nano-30b-a3b", - "name": "NVIDIA: Nemotron 3 Nano 30B A3B", - "display_name": "NVIDIA: Nemotron 3 Nano 30B A3B", + "id": "kwaipilot/kat-coder-pro", + "name": "Kwaipilot: KAT-Coder-Pro V1", + "display_name": "Kwaipilot: KAT-Coder-Pro V1", "modalities": { "input": [ "text" @@ -90117,20 +101188,19 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 256000, + "output": 128000 }, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "type": "chat" }, { - "id": "nvidia/nemotron-3-nano-30b-a3b:free", - "name": "NVIDIA: Nemotron 3 Nano 30B A3B (free)", - "display_name": "NVIDIA: Nemotron 3 Nano 30B A3B (free)", + "id": "liquid/lfm-2.2-6b", + "name": "LiquidAI: LFM2-2.6B", + "display_name": "LiquidAI: LFM2-2.6B", "modalities": { "input": [ "text" @@ -90140,70 +101210,64 @@ ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 32768, + "output": 32768 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "type": "chat" }, { - "id": "nvidia/nemotron-nano-12b-v2-vl", - "name": "NVIDIA: Nemotron Nano 12B 2 VL", - "display_name": "NVIDIA: Nemotron Nano 12B 2 VL", + "id": "liquid/lfm-2.5-1.2b-instruct:free", + "name": "LiquidAI: LFM2.5-1.2B-Instruct (free)", + "display_name": "LiquidAI: LFM2.5-1.2B-Instruct (free)", "modalities": { "input": [ - "image", - "text", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 32768, + "output": 32768 }, "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "nvidia/nemotron-nano-12b-v2-vl:free", - "name": "NVIDIA: Nemotron Nano 12B 2 VL (free)", - "display_name": "NVIDIA: Nemotron Nano 12B 2 VL (free)", + "id": "liquid/lfm-2.5-1.2b-thinking:free", + "name": "LiquidAI: LFM2.5-1.2B-Thinking (free)", + "display_name": "LiquidAI: LFM2.5-1.2B-Thinking (free)", "modalities": { "input": [ - "image", - "text", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 32768, + "output": 32768 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "nvidia/nemotron-nano-9b-v2", - "name": "NVIDIA: Nemotron Nano 9B V2", - "display_name": "NVIDIA: Nemotron Nano 9B V2", + "id": "liquid/lfm2-8b-a1b", + "name": "LiquidAI: LFM2-8B-A1B", + "display_name": "LiquidAI: LFM2-8B-A1B", "modalities": { "input": [ "text" @@ -90213,20 +101277,19 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 32768, + "output": 32768 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "type": "chat" }, { - "id": "nvidia/nemotron-nano-9b-v2:free", - "name": "NVIDIA: Nemotron Nano 9B V2 (free)", - "display_name": "NVIDIA: Nemotron Nano 9B V2 (free)", + "id": "mancer/weaver", + "name": "Mancer: Weaver (alpha)", + "display_name": "Mancer: Weaver (alpha)", "modalities": { "input": [ "text" @@ -90236,46 +101299,43 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 8000, + "output": 2000 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "type": "chat" }, { - "id": "openai/chatgpt-4o-latest", - "name": "OpenAI: ChatGPT-4o", - "display_name": "OpenAI: ChatGPT-4o", + "id": "meituan/longcat-flash-chat", + "name": "Meituan: LongCat Flash Chat", + "display_name": "Meituan: LongCat Flash Chat", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 131072, + "output": 32768 }, "tool_call": false, "reasoning": { "supported": false }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "openai/codex-mini", - "name": "OpenAI: Codex Mini", - "display_name": "OpenAI: Codex Mini", + "id": "meta-llama/llama-3-70b-instruct", + "name": "Meta: Llama 3 70B Instruct", + "display_name": "Meta: Llama 3 70B Instruct", "modalities": { "input": [ - "image", "text" ], "output": [ @@ -90283,20 +101343,19 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 8192, + "output": 8000 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "openai/gpt-3.5-turbo", - "name": "OpenAI: GPT-3.5 Turbo", - "display_name": "OpenAI: GPT-3.5 Turbo", + "id": "meta-llama/llama-3-8b-instruct", + "name": "Meta: Llama 3 8B Instruct", + "display_name": "Meta: Llama 3 8B Instruct", "modalities": { "input": [ "text" @@ -90306,8 +101365,8 @@ ] }, "limit": { - "context": 16385, - "output": 4096 + "context": 8192, + "output": 16384 }, "tool_call": true, "reasoning": { @@ -90316,9 +101375,9 @@ "type": "chat" }, { - "id": "openai/gpt-3.5-turbo-0613", - "name": "OpenAI: GPT-3.5 Turbo (older v0613)", - "display_name": "OpenAI: GPT-3.5 Turbo (older v0613)", + "id": "meta-llama/llama-3.1-405b", + "name": "Meta: Llama 3.1 405B (base)", + "display_name": "Meta: Llama 3.1 405B (base)", "modalities": { "input": [ "text" @@ -90328,19 +101387,19 @@ ] }, "limit": { - "context": 4095, - "output": 4096 + "context": 32768, + "output": 32768 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "type": "chat" }, { - "id": "openai/gpt-3.5-turbo-16k", - "name": "OpenAI: GPT-3.5 Turbo 16k", - "display_name": "OpenAI: GPT-3.5 Turbo 16k", + "id": "meta-llama/llama-3.1-405b-instruct", + "name": "Meta: Llama 3.1 405B Instruct", + "display_name": "Meta: Llama 3.1 405B Instruct", "modalities": { "input": [ "text" @@ -90350,8 +101409,8 @@ ] }, "limit": { - "context": 16385, - "output": 4096 + "context": 131000, + "output": 131000 }, "tool_call": true, "reasoning": { @@ -90360,9 +101419,9 @@ "type": "chat" }, { - "id": "openai/gpt-3.5-turbo-instruct", - "name": "OpenAI: GPT-3.5 Turbo Instruct", - "display_name": "OpenAI: GPT-3.5 Turbo Instruct", + "id": "meta-llama/llama-3.1-70b-instruct", + "name": "Meta: Llama 3.1 70B Instruct", + "display_name": "Meta: Llama 3.1 70B Instruct", "modalities": { "input": [ "text" @@ -90372,19 +101431,19 @@ ] }, "limit": { - "context": 4095, - "output": 4096 + "context": 131072, + "output": 131072 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "type": "chat" }, { - "id": "openai/gpt-4", - "name": "OpenAI: GPT-4", - "display_name": "OpenAI: GPT-4", + "id": "meta-llama/llama-3.1-8b-instruct", + "name": "Meta: Llama 3.1 8B Instruct", + "display_name": "Meta: Llama 3.1 8B Instruct", "modalities": { "input": [ "text" @@ -90394,8 +101453,8 @@ ] }, "limit": { - "context": 8191, - "output": 4096 + "context": 16384, + "output": 16384 }, "tool_call": true, "reasoning": { @@ -90404,31 +101463,32 @@ "type": "chat" }, { - "id": "openai/gpt-4-0314", - "name": "OpenAI: GPT-4 (older v0314)", - "display_name": "OpenAI: GPT-4 (older v0314)", + "id": "meta-llama/llama-3.2-11b-vision-instruct", + "name": "Meta: Llama 3.2 11B Vision Instruct", + "display_name": "Meta: Llama 3.2 11B Vision Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8191, - "output": 4096 + "context": 131072, + "output": 16384 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "openai/gpt-4-1106-preview", - "name": "OpenAI: GPT-4 Turbo (older v1106)", - "display_name": "OpenAI: GPT-4 Turbo (older v1106)", + "id": "meta-llama/llama-3.2-1b-instruct", + "name": "Meta: Llama 3.2 1B Instruct", + "display_name": "Meta: Llama 3.2 1B Instruct", "modalities": { "input": [ "text" @@ -90438,42 +101498,41 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 60000, + "output": 60000 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "type": "chat" }, { - "id": "openai/gpt-4-turbo", - "name": "OpenAI: GPT-4 Turbo", - "display_name": "OpenAI: GPT-4 Turbo", + "id": "meta-llama/llama-3.2-3b-instruct", + "name": "Meta: Llama 3.2 3B Instruct", + "display_name": "Meta: Llama 3.2 3B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 131072, + "output": 16384 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "openai/gpt-4-turbo-preview", - "name": "OpenAI: GPT-4 Turbo Preview", - "display_name": "OpenAI: GPT-4 Turbo Preview", + "id": "meta-llama/llama-3.2-3b-instruct:free", + "name": "Meta: Llama 3.2 3B Instruct (free)", + "display_name": "Meta: Llama 3.2 3B Instruct (free)", "modalities": { "input": [ "text" @@ -90483,22 +101542,21 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 131072, + "output": 131072 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "type": "chat" }, { - "id": "openai/gpt-4.1", - "name": "OpenAI: GPT-4.1", - "display_name": "OpenAI: GPT-4.1", + "id": "meta-llama/llama-3.3-70b-instruct", + "name": "Meta: Llama 3.3 70B Instruct", + "display_name": "Meta: Llama 3.3 70B Instruct", "modalities": { "input": [ - "image", "text" ], "output": [ @@ -90506,23 +101564,21 @@ ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 131072, + "output": 16384 }, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "type": "imageGeneration" + "type": "chat" }, { - "id": "openai/gpt-4.1-mini", - "name": "OpenAI: GPT-4.1 Mini", - "display_name": "OpenAI: GPT-4.1 Mini", + "id": "meta-llama/llama-3.3-70b-instruct:free", + "name": "Meta: Llama 3.3 70B Instruct (free)", + "display_name": "Meta: Llama 3.3 70B Instruct (free)", "modalities": { "input": [ - "image", "text" ], "output": [ @@ -90530,44 +101586,42 @@ ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 128000, + "output": 128000 }, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "type": "imageGeneration" + "type": "chat" }, { - "id": "openai/gpt-4.1-nano", - "name": "OpenAI: GPT-4.1 Nano", - "display_name": "OpenAI: GPT-4.1 Nano", + "id": "meta-llama/llama-4-maverick", + "name": "Meta: Llama 4 Maverick", + "display_name": "Meta: Llama 4 Maverick", "modalities": { "input": [ - "image", - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 1048576, + "output": 16384 }, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, "type": "imageGeneration" }, { - "id": "openai/gpt-4o", - "name": "OpenAI: GPT-4o", - "display_name": "OpenAI: GPT-4o", + "id": "meta-llama/llama-4-scout", + "name": "Meta: Llama 4 Scout", + "display_name": "Meta: Llama 4 Scout", "modalities": { "input": [ "text", @@ -90578,95 +101632,88 @@ ] }, "limit": { - "context": 128000, + "context": 327680, "output": 16384 }, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, "type": "imageGeneration" }, { - "id": "openai/gpt-4o-2024-05-13", - "name": "OpenAI: GPT-4o (2024-05-13)", - "display_name": "OpenAI: GPT-4o (2024-05-13)", + "id": "meta-llama/llama-guard-2-8b", + "name": "Meta: LlamaGuard 2 8B", + "display_name": "Meta: LlamaGuard 2 8B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 8192, + "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, - "type": "imageGeneration" + "type": "chat" }, { - "id": "openai/gpt-4o-2024-08-06", - "name": "OpenAI: GPT-4o (2024-08-06)", - "display_name": "OpenAI: GPT-4o (2024-08-06)", + "id": "meta-llama/llama-guard-3-8b", + "name": "Llama Guard 3 8B", + "display_name": "Llama Guard 3 8B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 131072, + "output": 131072 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, - "type": "imageGeneration" + "type": "chat" }, { - "id": "openai/gpt-4o-2024-11-20", - "name": "OpenAI: GPT-4o (2024-11-20)", - "display_name": "OpenAI: GPT-4o (2024-11-20)", + "id": "meta-llama/llama-guard-4-12b", + "name": "Meta: Llama Guard 4 12B", + "display_name": "Meta: Llama Guard 4 12B", "modalities": { "input": [ - "text", - "image" + "image", + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 163840, + "output": 163840 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, "type": "imageGeneration" }, { - "id": "openai/gpt-4o-audio-preview", - "name": "OpenAI: GPT-4o Audio", - "display_name": "OpenAI: GPT-4o Audio", + "id": "microsoft/phi-4", + "name": "Microsoft: Phi 4", + "display_name": "Microsoft: Phi 4", "modalities": { "input": [ - "audio", "text" ], "output": [ @@ -90674,42 +101721,41 @@ ] }, "limit": { - "context": 128000, + "context": 16384, "output": 16384 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false - } + }, + "type": "chat" }, { - "id": "openai/gpt-4o-mini", - "name": "OpenAI: GPT-4o-mini", - "display_name": "OpenAI: GPT-4o-mini", + "id": "microsoft/wizardlm-2-8x22b", + "name": "WizardLM-2 8x22B", + "display_name": "WizardLM-2 8x22B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 65536, "output": 16384 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, - "type": "imageGeneration" + "type": "chat" }, { - "id": "openai/gpt-4o-mini-2024-07-18", - "name": "OpenAI: GPT-4o-mini (2024-07-18)", - "display_name": "OpenAI: GPT-4o-mini (2024-07-18)", + "id": "minimax/minimax-01", + "name": "MiniMax: MiniMax-01", + "display_name": "MiniMax: MiniMax-01", "modalities": { "input": [ "text", @@ -90720,20 +101766,19 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 1000192, + "output": 1000192 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, "type": "imageGeneration" }, - { - "id": "openai/gpt-4o-mini-search-preview", - "name": "OpenAI: GPT-4o-mini Search Preview", - "display_name": "OpenAI: GPT-4o-mini Search Preview", + { + "id": "minimax/minimax-m1", + "name": "MiniMax: MiniMax M1", + "display_name": "MiniMax: MiniMax M1", "modalities": { "input": [ "text" @@ -90743,19 +101788,20 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 1000000, + "output": 40000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "type": "chat" }, { - "id": "openai/gpt-4o-search-preview", - "name": "OpenAI: GPT-4o Search Preview", - "display_name": "OpenAI: GPT-4o Search Preview", + "id": "minimax/minimax-m2", + "name": "MiniMax: MiniMax M2", + "display_name": "MiniMax: MiniMax M2", "modalities": { "input": [ "text" @@ -90765,73 +101811,70 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 196608, + "output": 65536 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "type": "chat" }, { - "id": "openai/gpt-4o:extended", - "name": "OpenAI: GPT-4o (extended)", - "display_name": "OpenAI: GPT-4o (extended)", + "id": "minimax/minimax-m2-her", + "name": "MiniMax: MiniMax M2-her", + "display_name": "MiniMax: MiniMax M2-her", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 64000 + "context": 65536, + "output": 2048 }, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, - "type": "imageGeneration" + "type": "chat" }, { - "id": "openai/gpt-5", - "name": "OpenAI: GPT-5", - "display_name": "OpenAI: GPT-5", + "id": "minimax/minimax-m2.1", + "name": "MiniMax: MiniMax M2.1", + "display_name": "MiniMax: MiniMax M2.1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 196608, + "output": 196608 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true, - "effort": "medium", - "verbosity": "medium" + "default": true }, - "attachment": true, - "type": "imageGeneration" + "type": "chat" }, { - "id": "openai/gpt-5-chat", - "name": "OpenAI: GPT-5 Chat", - "display_name": "OpenAI: GPT-5 Chat", + "id": "mistralai/codestral-2508", + "name": "Mistral: Codestral 2508", + "display_name": "Mistral: Codestral 2508", "modalities": { "input": [ - "image", "text" ], "output": [ @@ -90839,98 +101882,89 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 256000, + "output": 256000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "type": "imageGeneration" + "type": "chat" }, { - "id": "openai/gpt-5-codex", - "name": "OpenAI: GPT-5 Codex", - "display_name": "OpenAI: GPT-5 Codex", + "id": "mistralai/devstral-2512", + "name": "Mistral: Devstral 2 2512", + "display_name": "Mistral: Devstral 2 2512", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 262144, + "output": 65536 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true, - "effort": "medium", - "verbosity": "medium" + "supported": false }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "openai/gpt-5-image", - "name": "OpenAI: GPT-5 Image", - "display_name": "OpenAI: GPT-5 Image", + "id": "mistralai/devstral-medium", + "name": "Mistral: Devstral Medium", + "display_name": "Mistral: Devstral Medium", "modalities": { "input": [ - "image", "text" ], "output": [ - "image", "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 131072, + "output": 131072 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "type": "imageGeneration" + "type": "chat" }, { - "id": "openai/gpt-5-image-mini", - "name": "OpenAI: GPT-5 Image Mini", - "display_name": "OpenAI: GPT-5 Image Mini", + "id": "mistralai/devstral-small", + "name": "Mistral: Devstral Small 1.1", + "display_name": "Mistral: Devstral Small 1.1", "modalities": { "input": [ - "image", "text" ], "output": [ - "image", "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 131072, + "output": 131072 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "type": "imageGeneration" + "type": "chat" }, { - "id": "openai/gpt-5-mini", - "name": "OpenAI: GPT-5 Mini", - "display_name": "OpenAI: GPT-5 Mini", + "id": "mistralai/ministral-14b-2512", + "name": "Mistral: Ministral 3 14B 2512", + "display_name": "Mistral: Ministral 3 14B 2512", "modalities": { "input": [ "text", @@ -90941,80 +101975,69 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 262144, + "output": 262144 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true, - "effort": "medium", - "verbosity": "medium" + "supported": false }, - "attachment": true, "type": "imageGeneration" }, { - "id": "openai/gpt-5-nano", - "name": "OpenAI: GPT-5 Nano", - "display_name": "OpenAI: GPT-5 Nano", + "id": "mistralai/ministral-3b", + "name": "Mistral: Ministral 3B", + "display_name": "Mistral: Ministral 3B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 131072, + "output": 131072 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true, - "effort": "medium", - "verbosity": "medium" + "supported": false }, - "attachment": true, - "type": "imageGeneration" + "type": "chat" }, { - "id": "openai/gpt-5-pro", - "name": "OpenAI: GPT-5 Pro", - "display_name": "OpenAI: GPT-5 Pro", + "id": "mistralai/ministral-3b-2512", + "name": "Mistral: Ministral 3 3B 2512", + "display_name": "Mistral: Ministral 3 3B 2512", "modalities": { "input": [ - "image", - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 131072, + "output": 131072 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true, - "effort": "medium", - "verbosity": "medium" + "supported": false }, - "attachment": true, "type": "imageGeneration" }, { - "id": "openai/gpt-5.1", - "name": "OpenAI: GPT-5.1", - "display_name": "OpenAI: GPT-5.1", + "id": "mistralai/ministral-8b", + "name": "Mistral: Ministral 8B", + "display_name": "Mistral: Ministral 8B", "modalities": { "input": [ - "image", "text" ], "output": [ @@ -91022,96 +102045,92 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 131072, + "output": 131072 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "type": "imageGeneration" + "type": "chat" }, { - "id": "openai/gpt-5.1-chat", - "name": "OpenAI: GPT-5.1 Chat", - "display_name": "OpenAI: GPT-5.1 Chat", + "id": "mistralai/ministral-8b-2512", + "name": "Mistral: Ministral 3 8B 2512", + "display_name": "Mistral: Ministral 3 8B 2512", "modalities": { "input": [ - "image", - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 262144, + "output": 262144 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, "type": "imageGeneration" }, { - "id": "openai/gpt-5.1-codex", - "name": "OpenAI: GPT-5.1-Codex", - "display_name": "OpenAI: GPT-5.1-Codex", + "id": "mistralai/mistral-7b-instruct", + "name": "Mistral: Mistral 7B Instruct", + "display_name": "Mistral: Mistral 7B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 32768, + "output": 4096 }, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "openai/gpt-5.1-codex-max", - "name": "OpenAI: GPT-5.1-Codex-Max", - "display_name": "OpenAI: GPT-5.1-Codex-Max", + "id": "mistralai/mistral-7b-instruct-v0.1", + "name": "Mistral: Mistral 7B Instruct v0.1", + "display_name": "Mistral: Mistral 7B Instruct v0.1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 2824, + "output": 2824 }, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "openai/gpt-5.1-codex-mini", - "name": "OpenAI: GPT-5.1-Codex-Mini", - "display_name": "OpenAI: GPT-5.1-Codex-Mini", + "id": "mistralai/mistral-7b-instruct-v0.2", + "name": "Mistral: Mistral 7B Instruct v0.2", + "display_name": "Mistral: Mistral 7B Instruct v0.2", "modalities": { "input": [ - "image", "text" ], "output": [ @@ -91119,23 +102138,22 @@ ] }, "limit": { - "context": 400000, - "output": 100000 + "context": 32768, + "output": 32768 }, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "openai/gpt-5.2", - "name": "OpenAI: GPT-5.2", - "display_name": "OpenAI: GPT-5.2", + "id": "mistralai/mistral-7b-instruct-v0.3", + "name": "Mistral: Mistral 7B Instruct v0.3", + "display_name": "Mistral: Mistral 7B Instruct v0.3", "modalities": { "input": [ - "image", "text" ], "output": [ @@ -91143,24 +102161,22 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 32768, + "output": 4096 }, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "type": "imageGeneration" + "type": "chat" }, { - "id": "openai/gpt-5.2-chat", - "name": "OpenAI: GPT-5.2 Chat", - "display_name": "OpenAI: GPT-5.2 Chat", + "id": "mistralai/mistral-large", + "name": "Mistral Large", + "display_name": "Mistral Large", "modalities": { "input": [ - "image", "text" ], "output": [ @@ -91169,22 +102185,21 @@ }, "limit": { "context": 128000, - "output": 16384 + "output": 128000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "type": "imageGeneration" + "type": "chat" }, { - "id": "openai/gpt-5.2-pro", - "name": "OpenAI: GPT-5.2 Pro", - "display_name": "OpenAI: GPT-5.2 Pro", + "id": "mistralai/mistral-large-2407", + "name": "Mistral Large 2407", + "display_name": "Mistral Large 2407", "modalities": { "input": [ - "image", "text" ], "output": [ @@ -91192,21 +102207,20 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 131072, + "output": 131072 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "type": "imageGeneration" + "type": "chat" }, { - "id": "openai/gpt-oss-120b", - "name": "OpenAI: gpt-oss-120b", - "display_name": "OpenAI: gpt-oss-120b", + "id": "mistralai/mistral-large-2411", + "name": "Mistral Large 2411", + "display_name": "Mistral Large 2411", "modalities": { "input": [ "text" @@ -91219,43 +102233,45 @@ "context": 131072, "output": 131072 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "type": "chat" }, { - "id": "openai/gpt-oss-120b:exacto", - "name": "OpenAI: gpt-oss-120b (exacto)", - "display_name": "OpenAI: gpt-oss-120b (exacto)", + "id": "mistralai/mistral-large-2512", + "name": "Mistral: Mistral Large 3 2512", + "display_name": "Mistral: Mistral Large 3 2512", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 262144, + "output": 262144 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "openai/gpt-oss-120b:free", - "name": "OpenAI: gpt-oss-120b (free)", - "display_name": "OpenAI: gpt-oss-120b (free)", + "id": "mistralai/mistral-medium-3", + "name": "Mistral: Mistral Medium 3", + "display_name": "Mistral: Mistral Medium 3", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -91265,20 +102281,21 @@ "context": 131072, "output": 131072 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "openai/gpt-oss-20b", - "name": "OpenAI: gpt-oss-20b", - "display_name": "OpenAI: gpt-oss-20b", + "id": "mistralai/mistral-medium-3.1", + "name": "Mistral: Mistral Medium 3.1", + "display_name": "Mistral: Mistral Medium 3.1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -91288,17 +102305,17 @@ "context": 131072, "output": 131072 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "openai/gpt-oss-20b:free", - "name": "OpenAI: gpt-oss-20b (free)", - "display_name": "OpenAI: gpt-oss-20b (free)", + "id": "mistralai/mistral-nemo", + "name": "Mistral: Mistral Nemo", + "display_name": "Mistral: Mistral Nemo", "modalities": { "input": [ "text" @@ -91309,19 +102326,19 @@ }, "limit": { "context": 131072, - "output": 131072 + "output": 16384 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "type": "chat" }, { - "id": "openai/gpt-oss-safeguard-20b", - "name": "OpenAI: gpt-oss-safeguard-20b", - "display_name": "OpenAI: gpt-oss-safeguard-20b", + "id": "mistralai/mistral-saba", + "name": "Mistral: Saba", + "display_name": "Mistral: Saba", "modalities": { "input": [ "text" @@ -91331,44 +102348,43 @@ ] }, "limit": { - "context": 131072, - "output": 65536 + "context": 32768, + "output": 32768 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "type": "chat" }, { - "id": "openai/o1", - "name": "OpenAI: o1", - "display_name": "OpenAI: o1", + "id": "mistralai/mistral-small-24b-instruct-2501", + "name": "Mistral: Mistral Small 3", + "display_name": "Mistral: Mistral Small 3", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 32768, + "output": 32768 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "type": "imageGeneration" + "type": "chat" }, { - "id": "openai/o1-pro", - "name": "OpenAI: o1-pro", - "display_name": "OpenAI: o1-pro", + "id": "mistralai/mistral-small-3.1-24b-instruct", + "name": "Mistral: Mistral Small 3.1 24B", + "display_name": "Mistral: Mistral Small 3.1 24B", "modalities": { "input": [ "text", @@ -91379,48 +102395,44 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 131072, + "output": 131072 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": true, - "default": true, - "effort": "medium" + "supported": false }, - "attachment": true, "type": "imageGeneration" }, { - "id": "openai/o3", - "name": "OpenAI: o3", - "display_name": "OpenAI: o3", + "id": "mistralai/mistral-small-3.1-24b-instruct:free", + "name": "Mistral: Mistral Small 3.1 24B (free)", + "display_name": "Mistral: Mistral Small 3.1 24B (free)", "modalities": { "input": [ - "image", - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 128000, + "output": 128000 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true, - "effort": "medium" + "supported": false }, - "attachment": true, "type": "imageGeneration" }, { - "id": "openai/o3-deep-research", - "name": "OpenAI: o3 Deep Research", - "display_name": "OpenAI: o3 Deep Research", + "id": "mistralai/mistral-small-3.2-24b-instruct", + "name": "Mistral: Mistral Small 3.2 24B", + "display_name": "Mistral: Mistral Small 3.2 24B", "modalities": { "input": [ "image", @@ -91431,21 +102443,20 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 131072, + "output": 131072 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, "type": "imageGeneration" }, { - "id": "openai/o3-mini", - "name": "OpenAI: o3 Mini", - "display_name": "OpenAI: o3 Mini", + "id": "mistralai/mistral-small-creative", + "name": "Mistral: Mistral Small Creative", + "display_name": "Mistral: Mistral Small Creative", "modalities": { "input": [ "text" @@ -91455,20 +102466,20 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 32768, + "output": 32768 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, "type": "chat" }, { - "id": "openai/o3-mini-high", - "name": "OpenAI: o3 Mini High", - "display_name": "OpenAI: o3 Mini High", + "id": "mistralai/mistral-tiny", + "name": "Mistral Tiny", + "display_name": "Mistral Tiny", "modalities": { "input": [ "text" @@ -91478,49 +102489,45 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 32768, + "output": 32768 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, "type": "chat" }, { - "id": "openai/o3-pro", - "name": "OpenAI: o3 Pro", - "display_name": "OpenAI: o3 Pro", + "id": "mistralai/mixtral-8x22b-instruct", + "name": "Mistral: Mixtral 8x22B Instruct", + "display_name": "Mistral: Mixtral 8x22B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 65536, + "output": 65536 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true, - "effort": "medium" + "supported": false }, - "attachment": true, - "type": "imageGeneration" + "type": "chat" }, { - "id": "openai/o4-mini", - "name": "OpenAI: o4 Mini", - "display_name": "OpenAI: o4 Mini", + "id": "mistralai/mixtral-8x7b-instruct", + "name": "Mistral: Mixtral 8x7B Instruct", + "display_name": "Mistral: Mixtral 8x7B Instruct", "modalities": { "input": [ - "image", "text" ], "output": [ @@ -91528,95 +102535,91 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 32768, + "output": 16384 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true, - "effort": "medium" + "supported": false }, - "attachment": true, - "type": "imageGeneration" + "type": "chat" }, { - "id": "openai/o4-mini-deep-research", - "name": "OpenAI: o4 Mini Deep Research", - "display_name": "OpenAI: o4 Mini Deep Research", + "id": "mistralai/pixtral-12b", + "name": "Mistral: Pixtral 12B", + "display_name": "Mistral: Pixtral 12B", "modalities": { "input": [ - "image", - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 32768, + "output": 32768 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, "type": "imageGeneration" }, { - "id": "openai/o4-mini-high", - "name": "OpenAI: o4 Mini High", - "display_name": "OpenAI: o4 Mini High", + "id": "mistralai/pixtral-large-2411", + "name": "Mistral: Pixtral Large 2411", + "display_name": "Mistral: Pixtral Large 2411", "modalities": { "input": [ - "image", - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 131072, + "output": 131072 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, "type": "imageGeneration" }, { - "id": "opengvlab/internvl3-78b", - "name": "OpenGVLab: InternVL3 78B", - "display_name": "OpenGVLab: InternVL3 78B", + "id": "mistralai/voxtral-small-24b-2507", + "name": "Mistral: Voxtral Small 24B 2507", + "display_name": "Mistral: Voxtral Small 24B 2507", "modalities": { "input": [ - "image", - "text" + "text", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 32000, + "output": 32000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false - }, - "type": "imageGeneration" + } }, { - "id": "openrouter/auto", - "name": "Auto Router", - "display_name": "Auto Router", + "id": "moonshotai/kimi-dev-72b", + "name": "MoonshotAI: Kimi Dev 72B", + "display_name": "MoonshotAI: Kimi Dev 72B", "modalities": { "input": [ "text" @@ -91626,19 +102629,20 @@ ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 131072, + "output": 131072 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "type": "chat" }, { - "id": "openrouter/bodybuilder", - "name": "Body Builder (beta)", - "display_name": "Body Builder (beta)", + "id": "moonshotai/kimi-k2", + "name": "MoonshotAI: Kimi K2 0711", + "display_name": "MoonshotAI: Kimi K2 0711", "modalities": { "input": [ "text" @@ -91648,42 +102652,41 @@ ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 131072, + "output": 131072 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "type": "chat" }, { - "id": "perplexity/sonar", - "name": "Perplexity: Sonar", - "display_name": "Perplexity: Sonar", + "id": "moonshotai/kimi-k2-0905", + "name": "MoonshotAI: Kimi K2 0905", + "display_name": "MoonshotAI: Kimi K2 0905", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 127072, - "output": 127072 + "context": 262144, + "output": 262144 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "perplexity/sonar-deep-research", - "name": "Perplexity: Sonar Deep Research", - "display_name": "Perplexity: Sonar Deep Research", + "id": "moonshotai/kimi-k2-0905:exacto", + "name": "MoonshotAI: Kimi K2 0905 (exacto)", + "display_name": "MoonshotAI: Kimi K2 0905 (exacto)", "modalities": { "input": [ "text" @@ -91693,43 +102696,42 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 262144, + "output": 262144 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "type": "chat" }, { - "id": "perplexity/sonar-pro", - "name": "Perplexity: Sonar Pro", - "display_name": "Perplexity: Sonar Pro", + "id": "moonshotai/kimi-k2-thinking", + "name": "MoonshotAI: Kimi K2 Thinking", + "display_name": "MoonshotAI: Kimi K2 Thinking", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 8000 + "context": 262144, + "output": 65535 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "perplexity/sonar-pro-search", - "name": "Perplexity: Sonar Pro Search", - "display_name": "Perplexity: Sonar Pro Search", + "id": "moonshotai/kimi-k2.5", + "name": "MoonshotAI: Kimi K2.5", + "display_name": "MoonshotAI: Kimi K2.5", "modalities": { "input": [ "text", @@ -91740,10 +102742,10 @@ ] }, "limit": { - "context": 200000, - "output": 8000 + "context": 262144, + "output": 65535 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true @@ -91751,33 +102753,31 @@ "type": "imageGeneration" }, { - "id": "perplexity/sonar-reasoning-pro", - "name": "Perplexity: Sonar Reasoning Pro", - "display_name": "Perplexity: Sonar Reasoning Pro", + "id": "morph/morph-v3-fast", + "name": "Morph: Morph V3 Fast", + "display_name": "Morph: Morph V3 Fast", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 81920, + "output": 38000 }, "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "prime-intellect/intellect-3", - "name": "Prime Intellect: INTELLECT-3", - "display_name": "Prime Intellect: INTELLECT-3", + "id": "morph/morph-v3-large", + "name": "Morph: Morph V3 Large", + "display_name": "Morph: Morph V3 Large", "modalities": { "input": [ "text" @@ -91787,21 +102787,19 @@ ] }, "limit": { - "context": 131072, + "context": 262144, "output": 131072 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "type": "chat" }, { - "id": "qwen/qwen-2.5-72b-instruct", - "name": "Qwen2.5 72B Instruct", - "display_name": "Qwen2.5 72B Instruct", + "id": "neversleep/llama-3.1-lumimaid-8b", + "name": "NeverSleep: Lumimaid v0.2 8B", + "display_name": "NeverSleep: Lumimaid v0.2 8B", "modalities": { "input": [ "text" @@ -91812,18 +102810,18 @@ }, "limit": { "context": 32768, - "output": 16384 + "output": 4096 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "type": "chat" }, { - "id": "qwen/qwen-2.5-7b-instruct", - "name": "Qwen: Qwen2.5 7B Instruct", - "display_name": "Qwen: Qwen2.5 7B Instruct", + "id": "neversleep/noromaid-20b", + "name": "Noromaid 20B", + "display_name": "Noromaid 20B", "modalities": { "input": [ "text" @@ -91833,19 +102831,19 @@ ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 4096, + "output": 2048 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "type": "chat" }, { - "id": "qwen/qwen-2.5-coder-32b-instruct", - "name": "Qwen2.5 Coder 32B Instruct", - "display_name": "Qwen2.5 Coder 32B Instruct", + "id": "nex-agi/deepseek-v3.1-nex-n1", + "name": "Nex AGI: DeepSeek V3.1 Nex N1", + "display_name": "Nex AGI: DeepSeek V3.1 Nex N1", "modalities": { "input": [ "text" @@ -91855,23 +102853,22 @@ ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 131072, + "output": 163840 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "type": "chat" }, { - "id": "qwen/qwen-2.5-vl-7b-instruct", - "name": "Qwen: Qwen2.5-VL 7B Instruct", - "display_name": "Qwen: Qwen2.5-VL 7B Instruct", + "id": "nousresearch/deephermes-3-mistral-24b-preview", + "name": "Nous: DeepHermes 3 Mistral 24B Preview", + "display_name": "Nous: DeepHermes 3 Mistral 24B Preview", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -91881,39 +102878,39 @@ "context": 32768, "output": 32768 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "qwen/qwen-2.5-vl-7b-instruct:free", - "name": "Qwen: Qwen2.5-VL 7B Instruct (free)", - "display_name": "Qwen: Qwen2.5-VL 7B Instruct (free)", + "id": "nousresearch/hermes-2-pro-llama-3-8b", + "name": "NousResearch: Hermes 2 Pro - Llama-3 8B", + "display_name": "NousResearch: Hermes 2 Pro - Llama-3 8B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 8192, + "output": 8192 }, "tool_call": false, "reasoning": { "supported": false }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "qwen/qwen-max", - "name": "Qwen: Qwen-Max", - "display_name": "Qwen: Qwen-Max", + "id": "nousresearch/hermes-3-llama-3.1-405b", + "name": "Nous: Hermes 3 405B Instruct", + "display_name": "Nous: Hermes 3 405B Instruct", "modalities": { "input": [ "text" @@ -91923,19 +102920,19 @@ ] }, "limit": { - "context": 32768, - "output": 8192 + "context": 131072, + "output": 16384 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "type": "chat" }, { - "id": "qwen/qwen-plus", - "name": "Qwen: Qwen-Plus", - "display_name": "Qwen: Qwen-Plus", + "id": "nousresearch/hermes-3-llama-3.1-405b:free", + "name": "Nous: Hermes 3 405B Instruct (free)", + "display_name": "Nous: Hermes 3 405B Instruct (free)", "modalities": { "input": [ "text" @@ -91946,18 +102943,18 @@ }, "limit": { "context": 131072, - "output": 8192 + "output": 131072 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "type": "chat" }, { - "id": "qwen/qwen-plus-2025-07-28", - "name": "Qwen: Qwen Plus 0728", - "display_name": "Qwen: Qwen Plus 0728", + "id": "nousresearch/hermes-3-llama-3.1-70b", + "name": "Nous: Hermes 3 70B Instruct", + "display_name": "Nous: Hermes 3 70B Instruct", "modalities": { "input": [ "text" @@ -91967,19 +102964,19 @@ ] }, "limit": { - "context": 1000000, - "output": 32768 + "context": 65536, + "output": 65536 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "type": "chat" }, { - "id": "qwen/qwen-plus-2025-07-28:thinking", - "name": "Qwen: Qwen Plus 0728 (thinking)", - "display_name": "Qwen: Qwen Plus 0728 (thinking)", + "id": "nousresearch/hermes-4-405b", + "name": "Nous: Hermes 4 405B", + "display_name": "Nous: Hermes 4 405B", "modalities": { "input": [ "text" @@ -91989,10 +102986,10 @@ ] }, "limit": { - "context": 1000000, - "output": 32768 + "context": 131072, + "output": 131072 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true @@ -92000,9 +102997,9 @@ "type": "chat" }, { - "id": "qwen/qwen-turbo", - "name": "Qwen: Qwen-Turbo", - "display_name": "Qwen: Qwen-Turbo", + "id": "nousresearch/hermes-4-70b", + "name": "Nous: Hermes 4 70B", + "display_name": "Nous: Hermes 4 70B", "modalities": { "input": [ "text" @@ -92012,23 +103009,23 @@ ] }, "limit": { - "context": 1000000, - "output": 8192 + "context": 131072, + "output": 131072 }, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "type": "chat" }, { - "id": "qwen/qwen-vl-max", - "name": "Qwen: Qwen VL Max", - "display_name": "Qwen: Qwen VL Max", + "id": "nvidia/llama-3.1-nemotron-70b-instruct", + "name": "NVIDIA: Llama 3.1 Nemotron 70B Instruct", + "display_name": "NVIDIA: Llama 3.1 Nemotron 70B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -92036,41 +103033,41 @@ }, "limit": { "context": 131072, - "output": 8192 + "output": 16384 }, "tool_call": true, "reasoning": { "supported": false }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "qwen/qwen-vl-plus", - "name": "Qwen: Qwen VL Plus", - "display_name": "Qwen: Qwen VL Plus", + "id": "nvidia/llama-3.1-nemotron-ultra-253b-v1", + "name": "NVIDIA: Llama 3.1 Nemotron Ultra 253B v1", + "display_name": "NVIDIA: Llama 3.1 Nemotron Ultra 253B v1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 7500, - "output": 1500 + "context": 131072, + "output": 131072 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "qwen/qwen2.5-coder-7b-instruct", - "name": "Qwen: Qwen2.5 Coder 7B Instruct", - "display_name": "Qwen: Qwen2.5 Coder 7B Instruct", + "id": "nvidia/llama-3.3-nemotron-super-49b-v1.5", + "name": "NVIDIA: Llama 3.3 Nemotron Super 49B V1.5", + "display_name": "NVIDIA: Llama 3.3 Nemotron Super 49B V1.5", "modalities": { "input": [ "text" @@ -92080,111 +103077,116 @@ ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 131072, + "output": 131072 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "type": "chat" }, { - "id": "qwen/qwen2.5-vl-32b-instruct", - "name": "Qwen: Qwen2.5 VL 32B Instruct", - "display_name": "Qwen: Qwen2.5 VL 32B Instruct", + "id": "nvidia/nemotron-3-nano-30b-a3b", + "name": "NVIDIA: Nemotron 3 Nano 30B A3B", + "display_name": "NVIDIA: Nemotron 3 Nano 30B A3B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 262144, + "output": 262144 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "qwen/qwen2.5-vl-72b-instruct", - "name": "Qwen: Qwen2.5 VL 72B Instruct", - "display_name": "Qwen: Qwen2.5 VL 72B Instruct", + "id": "nvidia/nemotron-3-nano-30b-a3b:free", + "name": "NVIDIA: Nemotron 3 Nano 30B A3B (free)", + "display_name": "NVIDIA: Nemotron 3 Nano 30B A3B (free)", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 256000, + "output": 256000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "qwen/qwen3-14b", - "name": "Qwen: Qwen3 14B", - "display_name": "Qwen: Qwen3 14B", + "id": "nvidia/nemotron-nano-12b-v2-vl", + "name": "NVIDIA: Nemotron Nano 12B 2 VL", + "display_name": "NVIDIA: Nemotron Nano 12B 2 VL", "modalities": { "input": [ - "text" + "image", + "text", + "video" ], "output": [ "text" ] }, "limit": { - "context": 40960, - "output": 40960 + "context": 131072, + "output": 131072 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "qwen/qwen3-235b-a22b", - "name": "Qwen: Qwen3 235B A22B", - "display_name": "Qwen: Qwen3 235B A22B", + "id": "nvidia/nemotron-nano-12b-v2-vl:free", + "name": "NVIDIA: Nemotron Nano 12B 2 VL (free)", + "display_name": "NVIDIA: Nemotron Nano 12B 2 VL (free)", "modalities": { "input": [ - "text" + "image", + "text", + "video" ], "output": [ "text" ] }, "limit": { - "context": 40960, - "output": 40960 + "context": 128000, + "output": 128000 }, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "qwen/qwen3-235b-a22b-2507", - "name": "Qwen: Qwen3 235B A22B Instruct 2507", - "display_name": "Qwen: Qwen3 235B A22B Instruct 2507", + "id": "nvidia/nemotron-nano-9b-v2", + "name": "NVIDIA: Nemotron Nano 9B V2", + "display_name": "NVIDIA: Nemotron Nano 9B V2", "modalities": { "input": [ "text" @@ -92194,8 +103196,8 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 131072, + "output": 131072 }, "tool_call": true, "reasoning": { @@ -92205,9 +103207,9 @@ "type": "chat" }, { - "id": "qwen/qwen3-235b-a22b-thinking-2507", - "name": "Qwen: Qwen3 235B A22B Thinking 2507", - "display_name": "Qwen: Qwen3 235B A22B Thinking 2507", + "id": "nvidia/nemotron-nano-9b-v2:free", + "name": "NVIDIA: Nemotron Nano 9B V2 (free)", + "display_name": "NVIDIA: Nemotron Nano 9B V2 (free)", "modalities": { "input": [ "text" @@ -92217,8 +103219,8 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 128000, + "output": 128000 }, "tool_call": true, "reasoning": { @@ -92228,32 +103230,32 @@ "type": "chat" }, { - "id": "qwen/qwen3-30b-a3b", - "name": "Qwen: Qwen3 30B A3B", - "display_name": "Qwen: Qwen3 30B A3B", + "id": "openai/chatgpt-4o-latest", + "name": "OpenAI: ChatGPT-4o", + "display_name": "OpenAI: ChatGPT-4o", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 40960, - "output": 40960 + "context": 128000, + "output": 16384 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "qwen/qwen3-30b-a3b-instruct-2507", - "name": "Qwen: Qwen3 30B A3B Instruct 2507", - "display_name": "Qwen: Qwen3 30B A3B Instruct 2507", + "id": "openai/gpt-3.5-turbo", + "name": "OpenAI: GPT-3.5 Turbo", + "display_name": "OpenAI: GPT-3.5 Turbo", "modalities": { "input": [ "text" @@ -92263,8 +103265,8 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 16385, + "output": 4096 }, "tool_call": true, "reasoning": { @@ -92273,9 +103275,9 @@ "type": "chat" }, { - "id": "qwen/qwen3-30b-a3b-thinking-2507", - "name": "Qwen: Qwen3 30B A3B Thinking 2507", - "display_name": "Qwen: Qwen3 30B A3B Thinking 2507", + "id": "openai/gpt-3.5-turbo-0613", + "name": "OpenAI: GPT-3.5 Turbo (older v0613)", + "display_name": "OpenAI: GPT-3.5 Turbo (older v0613)", "modalities": { "input": [ "text" @@ -92285,20 +103287,19 @@ ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 4095, + "output": 4096 }, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "type": "chat" }, { - "id": "qwen/qwen3-32b", - "name": "Qwen: Qwen3 32B", - "display_name": "Qwen: Qwen3 32B", + "id": "openai/gpt-3.5-turbo-16k", + "name": "OpenAI: GPT-3.5 Turbo 16k", + "display_name": "OpenAI: GPT-3.5 Turbo 16k", "modalities": { "input": [ "text" @@ -92308,20 +103309,19 @@ ] }, "limit": { - "context": 40960, - "output": 40960 + "context": 16385, + "output": 4096 }, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "type": "chat" }, { - "id": "qwen/qwen3-4b:free", - "name": "Qwen: Qwen3 4B (free)", - "display_name": "Qwen: Qwen3 4B (free)", + "id": "openai/gpt-3.5-turbo-instruct", + "name": "OpenAI: GPT-3.5 Turbo Instruct", + "display_name": "OpenAI: GPT-3.5 Turbo Instruct", "modalities": { "input": [ "text" @@ -92331,20 +103331,19 @@ ] }, "limit": { - "context": 40960, - "output": 40960 + "context": 4095, + "output": 4096 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "type": "chat" }, { - "id": "qwen/qwen3-8b", - "name": "Qwen: Qwen3 8B", - "display_name": "Qwen: Qwen3 8B", + "id": "openai/gpt-4", + "name": "OpenAI: GPT-4", + "display_name": "OpenAI: GPT-4", "modalities": { "input": [ "text" @@ -92354,20 +103353,19 @@ ] }, "limit": { - "context": 128000, - "output": 20000 + "context": 8191, + "output": 4096 }, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "type": "chat" }, { - "id": "qwen/qwen3-coder", - "name": "Qwen: Qwen3 Coder 480B A35B", - "display_name": "Qwen: Qwen3 Coder 480B A35B", + "id": "openai/gpt-4-0314", + "name": "OpenAI: GPT-4 (older v0314)", + "display_name": "OpenAI: GPT-4 (older v0314)", "modalities": { "input": [ "text" @@ -92377,20 +103375,19 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 8191, + "output": 4096 }, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "type": "chat" }, { - "id": "qwen/qwen3-coder-30b-a3b-instruct", - "name": "Qwen: Qwen3 Coder 30B A3B Instruct", - "display_name": "Qwen: Qwen3 Coder 30B A3B Instruct", + "id": "openai/gpt-4-1106-preview", + "name": "OpenAI: GPT-4 Turbo (older v1106)", + "display_name": "OpenAI: GPT-4 Turbo (older v1106)", "modalities": { "input": [ "text" @@ -92400,8 +103397,8 @@ ] }, "limit": { - "context": 160000, - "output": 32768 + "context": 128000, + "output": 4096 }, "tool_call": true, "reasoning": { @@ -92410,12 +103407,13 @@ "type": "chat" }, { - "id": "qwen/qwen3-coder-flash", - "name": "Qwen: Qwen3 Coder Flash", - "display_name": "Qwen: Qwen3 Coder Flash", + "id": "openai/gpt-4-turbo", + "name": "OpenAI: GPT-4 Turbo", + "display_name": "OpenAI: GPT-4 Turbo", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -92423,18 +103421,18 @@ }, "limit": { "context": 128000, - "output": 65536 + "output": 4096 }, "tool_call": true, "reasoning": { "supported": false }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "qwen/qwen3-coder-plus", - "name": "Qwen: Qwen3 Coder Plus", - "display_name": "Qwen: Qwen3 Coder Plus", + "id": "openai/gpt-4-turbo-preview", + "name": "OpenAI: GPT-4 Turbo Preview", + "display_name": "OpenAI: GPT-4 Turbo Preview", "modalities": { "input": [ "text" @@ -92445,7 +103443,7 @@ }, "limit": { "context": 128000, - "output": 65536 + "output": 4096 }, "tool_call": true, "reasoning": { @@ -92454,11 +103452,12 @@ "type": "chat" }, { - "id": "qwen/qwen3-coder:exacto", - "name": "Qwen: Qwen3 Coder 480B A35B (exacto)", - "display_name": "Qwen: Qwen3 Coder 480B A35B (exacto)", + "id": "openai/gpt-4.1", + "name": "OpenAI: GPT-4.1", + "display_name": "OpenAI: GPT-4.1", "modalities": { "input": [ + "image", "text" ], "output": [ @@ -92466,22 +103465,23 @@ ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 1047576, + "output": 32768 }, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "type": "chat" + "attachment": true, + "type": "imageGeneration" }, { - "id": "qwen/qwen3-coder:free", - "name": "Qwen: Qwen3 Coder 480B A35B (free)", - "display_name": "Qwen: Qwen3 Coder 480B A35B (free)", + "id": "openai/gpt-4.1-mini", + "name": "OpenAI: GPT-4.1 Mini", + "display_name": "OpenAI: GPT-4.1 Mini", "modalities": { "input": [ + "image", "text" ], "output": [ @@ -92489,21 +103489,23 @@ ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 1047576, + "output": 32768 }, "tool_call": true, "reasoning": { "supported": false }, - "type": "chat" + "attachment": true, + "type": "imageGeneration" }, { - "id": "qwen/qwen3-max", - "name": "Qwen: Qwen3 Max", - "display_name": "Qwen: Qwen3 Max", + "id": "openai/gpt-4.1-nano", + "name": "OpenAI: GPT-4.1 Nano", + "display_name": "OpenAI: GPT-4.1 Nano", "modalities": { "input": [ + "image", "text" ], "output": [ @@ -92511,65 +103513,68 @@ ] }, "limit": { - "context": 256000, + "context": 1047576, "output": 32768 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "type": "chat" + "attachment": true, + "type": "imageGeneration" }, { - "id": "qwen/qwen3-next-80b-a3b-instruct", - "name": "Qwen: Qwen3 Next 80B A3B Instruct", - "display_name": "Qwen: Qwen3 Next 80B A3B Instruct", + "id": "openai/gpt-4o", + "name": "OpenAI: GPT-4o", + "display_name": "OpenAI: GPT-4o", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 128000, + "output": 16384 }, "tool_call": true, "reasoning": { "supported": false }, - "type": "chat" + "attachment": true, + "type": "imageGeneration" }, { - "id": "qwen/qwen3-next-80b-a3b-thinking", - "name": "Qwen: Qwen3 Next 80B A3B Thinking", - "display_name": "Qwen: Qwen3 Next 80B A3B Thinking", + "id": "openai/gpt-4o-2024-05-13", + "name": "OpenAI: GPT-4o (2024-05-13)", + "display_name": "OpenAI: GPT-4o (2024-05-13)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 128000, + "output": 4096 }, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "type": "chat" + "attachment": true, + "type": "imageGeneration" }, { - "id": "qwen/qwen3-vl-235b-a22b-instruct", - "name": "Qwen: Qwen3 VL 235B A22B Instruct", - "display_name": "Qwen: Qwen3 VL 235B A22B Instruct", + "id": "openai/gpt-4o-2024-08-06", + "name": "OpenAI: GPT-4o (2024-08-06)", + "display_name": "OpenAI: GPT-4o (2024-08-06)", "modalities": { "input": [ "text", @@ -92580,20 +103585,20 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 128000, + "output": 16384 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": false }, + "attachment": true, "type": "imageGeneration" }, { - "id": "qwen/qwen3-vl-235b-a22b-thinking", - "name": "Qwen: Qwen3 VL 235B A22B Thinking", - "display_name": "Qwen: Qwen3 VL 235B A22B Thinking", + "id": "openai/gpt-4o-2024-11-20", + "name": "OpenAI: GPT-4o (2024-11-20)", + "display_name": "OpenAI: GPT-4o (2024-11-20)", "modalities": { "input": [ "text", @@ -92604,21 +103609,43 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 128000, + "output": 16384 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, + "attachment": true, "type": "imageGeneration" }, { - "id": "qwen/qwen3-vl-30b-a3b-instruct", - "name": "Qwen: Qwen3 VL 30B A3B Instruct", - "display_name": "Qwen: Qwen3 VL 30B A3B Instruct", + "id": "openai/gpt-4o-audio-preview", + "name": "OpenAI: GPT-4o Audio", + "display_name": "OpenAI: GPT-4o Audio", + "modalities": { + "input": [ + "audio", + "text" + ], + "output": [ + "text", + "audio" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "tool_call": true, + "reasoning": { + "supported": false + } + }, + { + "id": "openai/gpt-4o-mini", + "name": "OpenAI: GPT-4o-mini", + "display_name": "OpenAI: GPT-4o-mini", "modalities": { "input": [ "text", @@ -92629,20 +103656,20 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 128000, + "output": 16384 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": false }, + "attachment": true, "type": "imageGeneration" }, { - "id": "qwen/qwen3-vl-30b-a3b-thinking", - "name": "Qwen: Qwen3 VL 30B A3B Thinking", - "display_name": "Qwen: Qwen3 VL 30B A3B Thinking", + "id": "openai/gpt-4o-mini-2024-07-18", + "name": "OpenAI: GPT-4o-mini (2024-07-18)", + "display_name": "OpenAI: GPT-4o-mini (2024-07-18)", "modalities": { "input": [ "text", @@ -92653,47 +103680,44 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 128000, + "output": 16384 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, + "attachment": true, "type": "imageGeneration" }, { - "id": "qwen/qwen3-vl-32b-instruct", - "name": "Qwen: Qwen3 VL 32B Instruct", - "display_name": "Qwen: Qwen3 VL 32B Instruct", + "id": "openai/gpt-4o-mini-search-preview", + "name": "OpenAI: GPT-4o-mini Search Preview", + "display_name": "OpenAI: GPT-4o-mini Search Preview", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 128000, + "output": 16384 }, "tool_call": false, "reasoning": { "supported": false }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "qwen/qwen3-vl-8b-instruct", - "name": "Qwen: Qwen3 VL 8B Instruct", - "display_name": "Qwen: Qwen3 VL 8B Instruct", + "id": "openai/gpt-4o-search-preview", + "name": "OpenAI: GPT-4o Search Preview", + "display_name": "OpenAI: GPT-4o Search Preview", "modalities": { "input": [ - "image", "text" ], "output": [ @@ -92701,70 +103725,73 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 128000, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "qwen/qwen3-vl-8b-thinking", - "name": "Qwen: Qwen3 VL 8B Thinking", - "display_name": "Qwen: Qwen3 VL 8B Thinking", + "id": "openai/gpt-4o:extended", + "name": "OpenAI: GPT-4o (extended)", + "display_name": "OpenAI: GPT-4o (extended)", "modalities": { "input": [ - "image", - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 32768 + "context": 128000, + "output": 64000 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, + "attachment": true, "type": "imageGeneration" }, { - "id": "qwen/qwq-32b", - "name": "Qwen: QwQ 32B", - "display_name": "Qwen: QwQ 32B", + "id": "openai/gpt-5", + "name": "OpenAI: GPT-5", + "display_name": "OpenAI: GPT-5", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 400000, + "output": 128000 }, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": true, + "effort": "medium", + "verbosity": "medium" }, - "type": "chat" + "attachment": true, + "type": "imageGeneration" }, { - "id": "raifle/sorcererlm-8x22b", - "name": "SorcererLM 8x22B", - "display_name": "SorcererLM 8x22B", + "id": "openai/gpt-5-chat", + "name": "OpenAI: GPT-5 Chat", + "display_name": "OpenAI: GPT-5 Chat", "modalities": { "input": [ + "image", "text" ], "output": [ @@ -92772,109 +103799,155 @@ ] }, "limit": { - "context": 16000, - "output": 16000 + "context": 128000, + "output": 16384 }, "tool_call": false, "reasoning": { "supported": false }, - "type": "chat" + "attachment": true, + "type": "imageGeneration" }, { - "id": "relace/relace-apply-3", - "name": "Relace: Relace Apply 3", - "display_name": "Relace: Relace Apply 3", + "id": "openai/gpt-5-codex", + "name": "OpenAI: GPT-5 Codex", + "display_name": "OpenAI: GPT-5 Codex", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, + "context": 400000, "output": 128000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true, + "effort": "medium", + "verbosity": "medium" }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "relace/relace-search", - "name": "Relace: Relace Search", - "display_name": "Relace: Relace Search", + "id": "openai/gpt-5-image", + "name": "OpenAI: GPT-5 Image", + "display_name": "OpenAI: GPT-5 Image", "modalities": { "input": [ + "image", "text" ], "output": [ + "image", "text" ] }, "limit": { - "context": 256000, + "context": 400000, "output": 128000 }, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" + "attachment": true, + "type": "imageGeneration" }, { - "id": "sao10k/l3-euryale-70b", - "name": "Sao10k: Llama 3 Euryale 70B v2.1", - "display_name": "Sao10k: Llama 3 Euryale 70B v2.1", + "id": "openai/gpt-5-image-mini", + "name": "OpenAI: GPT-5 Image Mini", + "display_name": "OpenAI: GPT-5 Image Mini", "modalities": { "input": [ + "image", "text" ], "output": [ + "image", "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 400000, + "output": 128000 }, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" + "attachment": true, + "type": "imageGeneration" }, { - "id": "sao10k/l3-lunaris-8b", - "name": "Sao10K: Llama 3 8B Lunaris", - "display_name": "Sao10K: Llama 3 8B Lunaris", + "id": "openai/gpt-5-mini", + "name": "OpenAI: GPT-5 Mini", + "display_name": "OpenAI: GPT-5 Mini", "modalities": { "input": [ + "text", + "image" + ], + "output": [ "text" + ] + }, + "limit": { + "context": 400000, + "output": 128000 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true, + "effort": "medium", + "verbosity": "medium" + }, + "attachment": true, + "type": "imageGeneration" + }, + { + "id": "openai/gpt-5-nano", + "name": "OpenAI: GPT-5 Nano", + "display_name": "OpenAI: GPT-5 Nano", + "modalities": { + "input": [ + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 400000, + "output": 128000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true, + "effort": "medium", + "verbosity": "medium" }, - "type": "chat" + "attachment": true, + "type": "imageGeneration" }, { - "id": "sao10k/l3.1-70b-hanami-x1", - "name": "Sao10K: Llama 3.1 70B Hanami x1", - "display_name": "Sao10K: Llama 3.1 70B Hanami x1", + "id": "openai/gpt-5-pro", + "name": "OpenAI: GPT-5 Pro", + "display_name": "OpenAI: GPT-5 Pro", "modalities": { "input": [ + "image", "text" ], "output": [ @@ -92882,21 +103955,26 @@ ] }, "limit": { - "context": 16000, - "output": 16000 + "context": 400000, + "output": 128000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true, + "effort": "medium", + "verbosity": "medium" }, - "type": "chat" + "attachment": true, + "type": "imageGeneration" }, { - "id": "sao10k/l3.1-euryale-70b", - "name": "Sao10K: Llama 3.1 Euryale 70B v2.2", - "display_name": "Sao10K: Llama 3.1 Euryale 70B v2.2", + "id": "openai/gpt-5.1", + "name": "OpenAI: GPT-5.1", + "display_name": "OpenAI: GPT-5.1", "modalities": { "input": [ + "image", "text" ], "output": [ @@ -92904,21 +103982,24 @@ ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 400000, + "output": 128000 }, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" + "attachment": true, + "type": "imageGeneration" }, { - "id": "sao10k/l3.3-euryale-70b", - "name": "Sao10K: Llama 3.3 Euryale 70B", - "display_name": "Sao10K: Llama 3.3 Euryale 70B", + "id": "openai/gpt-5.1-chat", + "name": "OpenAI: GPT-5.1 Chat", + "display_name": "OpenAI: GPT-5.1 Chat", "modalities": { "input": [ + "image", "text" ], "output": [ @@ -92926,31 +104007,32 @@ ] }, "limit": { - "context": 131072, + "context": 128000, "output": 16384 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "type": "chat" + "attachment": true, + "type": "imageGeneration" }, { - "id": "stepfun-ai/step3", - "name": "StepFun: Step3", - "display_name": "StepFun: Step3", + "id": "openai/gpt-5.1-codex", + "name": "OpenAI: GPT-5.1-Codex", + "display_name": "OpenAI: GPT-5.1-Codex", "modalities": { "input": [ - "image", - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 65536, - "output": 65536 + "context": 400000, + "output": 128000 }, "tool_call": true, "reasoning": { @@ -92960,34 +104042,36 @@ "type": "imageGeneration" }, { - "id": "switchpoint/router", - "name": "Switchpoint Router", - "display_name": "Switchpoint Router", + "id": "openai/gpt-5.1-codex-max", + "name": "OpenAI: GPT-5.1-Codex-Max", + "display_name": "OpenAI: GPT-5.1-Codex-Max", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 400000, + "output": 128000 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "tencent/hunyuan-a13b-instruct", - "name": "Tencent: Hunyuan A13B Instruct", - "display_name": "Tencent: Hunyuan A13B Instruct", + "id": "openai/gpt-5.1-codex-mini", + "name": "OpenAI: GPT-5.1-Codex-Mini", + "display_name": "OpenAI: GPT-5.1-Codex-Mini", "modalities": { "input": [ + "image", "text" ], "output": [ @@ -92995,22 +104079,23 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 400000, + "output": 100000 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "thedrummer/cydonia-24b-v4.1", - "name": "TheDrummer: Cydonia 24B V4.1", - "display_name": "TheDrummer: Cydonia 24B V4.1", + "id": "openai/gpt-5.2", + "name": "OpenAI: GPT-5.2", + "display_name": "OpenAI: GPT-5.2", "modalities": { "input": [ + "image", "text" ], "output": [ @@ -93018,21 +104103,24 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 400000, + "output": 128000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" + "attachment": true, + "type": "imageGeneration" }, { - "id": "thedrummer/rocinante-12b", - "name": "TheDrummer: Rocinante 12B", - "display_name": "TheDrummer: Rocinante 12B", + "id": "openai/gpt-5.2-chat", + "name": "OpenAI: GPT-5.2 Chat", + "display_name": "OpenAI: GPT-5.2 Chat", "modalities": { "input": [ + "image", "text" ], "output": [ @@ -93040,43 +104128,47 @@ ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 128000, + "output": 16384 }, "tool_call": true, "reasoning": { "supported": false }, - "type": "chat" + "attachment": true, + "type": "imageGeneration" }, { - "id": "thedrummer/skyfall-36b-v2", - "name": "TheDrummer: Skyfall 36B V2", - "display_name": "TheDrummer: Skyfall 36B V2", + "id": "openai/gpt-5.2-codex", + "name": "OpenAI: GPT-5.2-Codex", + "display_name": "OpenAI: GPT-5.2-Codex", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 400000, + "output": 128000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "thedrummer/unslopnemo-12b", - "name": "TheDrummer: UnslopNemo 12B", - "display_name": "TheDrummer: UnslopNemo 12B", + "id": "openai/gpt-5.2-pro", + "name": "OpenAI: GPT-5.2 Pro", + "display_name": "OpenAI: GPT-5.2 Pro", "modalities": { "input": [ + "image", "text" ], "output": [ @@ -93084,66 +104176,67 @@ ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 400000, + "output": 128000 }, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" + "attachment": true, + "type": "imageGeneration" }, { - "id": "thudm/glm-4.1v-9b-thinking", - "name": "THUDM: GLM 4.1V 9B Thinking", - "display_name": "THUDM: GLM 4.1V 9B Thinking", + "id": "openai/gpt-audio", + "name": "OpenAI: GPT Audio", + "display_name": "OpenAI: GPT Audio", "modalities": { "input": [ - "image", - "text" + "text", + "audio" ], "output": [ - "text" + "text", + "audio" ] }, "limit": { - "context": 65536, - "output": 8000 + "context": 128000, + "output": 16384 }, "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "type": "imageGeneration" + "supported": false + } }, { - "id": "tngtech/deepseek-r1t-chimera", - "name": "TNG: DeepSeek R1T Chimera", - "display_name": "TNG: DeepSeek R1T Chimera", + "id": "openai/gpt-audio-mini", + "name": "OpenAI: GPT Audio Mini", + "display_name": "OpenAI: GPT Audio Mini", "modalities": { "input": [ - "text" + "text", + "audio" ], "output": [ - "text" + "text", + "audio" ] }, "limit": { - "context": 163840, - "output": 163840 + "context": 128000, + "output": 16384 }, "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "type": "chat" + "supported": false + } }, { - "id": "tngtech/deepseek-r1t-chimera:free", - "name": "TNG: DeepSeek R1T Chimera (free)", - "display_name": "TNG: DeepSeek R1T Chimera (free)", + "id": "openai/gpt-oss-120b", + "name": "OpenAI: gpt-oss-120b", + "display_name": "OpenAI: gpt-oss-120b", "modalities": { "input": [ "text" @@ -93153,10 +104246,10 @@ ] }, "limit": { - "context": 163840, - "output": 163840 + "context": 131072, + "output": 131072 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true @@ -93164,9 +104257,9 @@ "type": "chat" }, { - "id": "tngtech/deepseek-r1t2-chimera", - "name": "TNG: DeepSeek R1T2 Chimera", - "display_name": "TNG: DeepSeek R1T2 Chimera", + "id": "openai/gpt-oss-120b:exacto", + "name": "OpenAI: gpt-oss-120b (exacto)", + "display_name": "OpenAI: gpt-oss-120b (exacto)", "modalities": { "input": [ "text" @@ -93176,8 +104269,8 @@ ] }, "limit": { - "context": 163840, - "output": 163840 + "context": 131072, + "output": 131072 }, "tool_call": true, "reasoning": { @@ -93187,9 +104280,9 @@ "type": "chat" }, { - "id": "tngtech/deepseek-r1t2-chimera:free", - "name": "TNG: DeepSeek R1T2 Chimera (free)", - "display_name": "TNG: DeepSeek R1T2 Chimera (free)", + "id": "openai/gpt-oss-120b:free", + "name": "OpenAI: gpt-oss-120b (free)", + "display_name": "OpenAI: gpt-oss-120b (free)", "modalities": { "input": [ "text" @@ -93199,10 +104292,10 @@ ] }, "limit": { - "context": 163840, - "output": 163840 + "context": 131072, + "output": 131072 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true @@ -93210,9 +104303,9 @@ "type": "chat" }, { - "id": "tngtech/tng-r1t-chimera", - "name": "TNG: R1T Chimera", - "display_name": "TNG: R1T Chimera", + "id": "openai/gpt-oss-20b", + "name": "OpenAI: gpt-oss-20b", + "display_name": "OpenAI: gpt-oss-20b", "modalities": { "input": [ "text" @@ -93222,8 +104315,8 @@ ] }, "limit": { - "context": 163840, - "output": 65536 + "context": 131072, + "output": 131072 }, "tool_call": true, "reasoning": { @@ -93233,9 +104326,9 @@ "type": "chat" }, { - "id": "tngtech/tng-r1t-chimera:free", - "name": "TNG: R1T Chimera (free)", - "display_name": "TNG: R1T Chimera (free)", + "id": "openai/gpt-oss-20b:free", + "name": "OpenAI: gpt-oss-20b (free)", + "display_name": "OpenAI: gpt-oss-20b (free)", "modalities": { "input": [ "text" @@ -93245,8 +104338,8 @@ ] }, "limit": { - "context": 163840, - "output": 65536 + "context": 131072, + "output": 131072 }, "tool_call": true, "reasoning": { @@ -93256,9 +104349,9 @@ "type": "chat" }, { - "id": "undi95/remm-slerp-l2-13b", - "name": "ReMM SLERP 13B", - "display_name": "ReMM SLERP 13B", + "id": "openai/gpt-oss-safeguard-20b", + "name": "OpenAI: gpt-oss-safeguard-20b", + "display_name": "OpenAI: gpt-oss-safeguard-20b", "modalities": { "input": [ "text" @@ -93268,65 +104361,73 @@ ] }, "limit": { - "context": 6144, - "output": 6144 + "context": 131072, + "output": 65536 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "type": "chat" }, { - "id": "x-ai/grok-3", - "name": "xAI: Grok 3", - "display_name": "xAI: Grok 3", + "id": "openai/o1", + "name": "OpenAI: o1", + "display_name": "OpenAI: o1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 200000, + "output": 100000 }, "tool_call": true, "reasoning": { "supported": false }, - "type": "chat" + "attachment": true, + "type": "imageGeneration" }, { - "id": "x-ai/grok-3-beta", - "name": "xAI: Grok 3 Beta", - "display_name": "xAI: Grok 3 Beta", + "id": "openai/o1-pro", + "name": "OpenAI: o1-pro", + "display_name": "OpenAI: o1-pro", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 200000, + "output": 100000 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true, + "effort": "medium" }, - "type": "chat" + "attachment": true, + "type": "imageGeneration" }, { - "id": "x-ai/grok-3-mini", - "name": "xAI: Grok 3 Mini", - "display_name": "xAI: Grok 3 Mini", + "id": "openai/o3", + "name": "OpenAI: o3", + "display_name": "OpenAI: o3", "modalities": { "input": [ + "image", "text" ], "output": [ @@ -93334,22 +104435,25 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 200000, + "output": 100000 }, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": true, + "effort": "medium" }, - "type": "chat" + "attachment": true, + "type": "imageGeneration" }, { - "id": "x-ai/grok-3-mini-beta", - "name": "xAI: Grok 3 Mini Beta", - "display_name": "xAI: Grok 3 Mini Beta", + "id": "openai/o3-deep-research", + "name": "OpenAI: o3 Deep Research", + "display_name": "OpenAI: o3 Deep Research", "modalities": { "input": [ + "image", "text" ], "output": [ @@ -93357,23 +104461,23 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 200000, + "output": 100000 }, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "type": "chat" + "attachment": true, + "type": "imageGeneration" }, { - "id": "x-ai/grok-4", - "name": "xAI: Grok 4", - "display_name": "xAI: Grok 4", + "id": "openai/o3-mini", + "name": "OpenAI: o3 Mini", + "display_name": "OpenAI: o3 Mini", "modalities": { "input": [ - "image", "text" ], "output": [ @@ -93381,44 +104485,43 @@ ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 200000, + "output": 100000 }, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "type": "imageGeneration" + "attachment": true, + "type": "chat" }, { - "id": "x-ai/grok-4-fast", - "name": "xAI: Grok 4 Fast", - "display_name": "xAI: Grok 4 Fast", + "id": "openai/o3-mini-high", + "name": "OpenAI: o3 Mini High", + "display_name": "OpenAI: o3 Mini High", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 200000, + "output": 100000 }, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "type": "imageGeneration" + "attachment": true, + "type": "chat" }, { - "id": "x-ai/grok-4.1-fast", - "name": "xAI: Grok 4.1 Fast", - "display_name": "xAI: Grok 4.1 Fast", + "id": "openai/o3-pro", + "name": "OpenAI: o3 Pro", + "display_name": "OpenAI: o3 Pro", "modalities": { "input": [ "text", @@ -93429,23 +104532,25 @@ ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 200000, + "output": 100000 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": true, + "effort": "medium" }, + "attachment": true, "type": "imageGeneration" }, { - "id": "x-ai/grok-code-fast-1", - "name": "xAI: Grok Code Fast 1", - "display_name": "xAI: Grok Code Fast 1", + "id": "openai/o4-mini", + "name": "OpenAI: o4 Mini", + "display_name": "OpenAI: o4 Mini", "modalities": { "input": [ + "image", "text" ], "output": [ @@ -93453,22 +104558,25 @@ ] }, "limit": { - "context": 256000, - "output": 10000 + "context": 200000, + "output": 100000 }, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": true, + "effort": "medium" }, - "type": "chat" + "attachment": true, + "type": "imageGeneration" }, { - "id": "xiaomi/mimo-v2-flash:free", - "name": "Xiaomi: MiMo-V2-Flash (free)", - "display_name": "Xiaomi: MiMo-V2-Flash (free)", + "id": "openai/o4-mini-deep-research", + "name": "OpenAI: o4 Mini Deep Research", + "display_name": "OpenAI: o4 Mini Deep Research", "modalities": { "input": [ + "image", "text" ], "output": [ @@ -93476,22 +104584,24 @@ ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 200000, + "output": 100000 }, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "type": "chat" + "attachment": true, + "type": "imageGeneration" }, { - "id": "z-ai/glm-4-32b", - "name": "Z.AI: GLM 4 32B", - "display_name": "Z.AI: GLM 4 32B", + "id": "openai/o4-mini-high", + "name": "OpenAI: o4 Mini High", + "display_name": "OpenAI: o4 Mini High", "modalities": { "input": [ + "image", "text" ], "output": [ @@ -93499,22 +104609,24 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 200000, + "output": 100000 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" + "attachment": true, + "type": "imageGeneration" }, { - "id": "z-ai/glm-4.5", - "name": "Z.AI: GLM 4.5", - "display_name": "Z.AI: GLM 4.5", + "id": "opengvlab/internvl3-78b", + "name": "OpenGVLab: InternVL3 78B", + "display_name": "OpenGVLab: InternVL3 78B", "modalities": { "input": [ + "image", "text" ], "output": [ @@ -93522,45 +104634,47 @@ ] }, "limit": { - "context": 131072, - "output": 65536 + "context": 32768, + "output": 32768 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "z-ai/glm-4.5-air", - "name": "Z.AI: GLM 4.5 Air", - "display_name": "Z.AI: GLM 4.5 Air", + "id": "openrouter/auto", + "name": "Auto Router", + "display_name": "Auto Router", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video" ], "output": [ - "text" + "text", + "image" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 8192, + "output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "type": "chat" + "attachment": true, + "type": "imageGeneration" }, { - "id": "z-ai/glm-4.5-air:free", - "name": "Z.AI: GLM 4.5 Air (free)", - "display_name": "Z.AI: GLM 4.5 Air (free)", + "id": "openrouter/bodybuilder", + "name": "Body Builder (beta)", + "display_name": "Body Builder (beta)", "modalities": { "input": [ "text" @@ -93570,21 +104684,19 @@ ] }, "limit": { - "context": 131072, - "output": 96000 + "context": 8192, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "type": "chat" }, { - "id": "z-ai/glm-4.5v", - "name": "Z.AI: GLM 4.5V", - "display_name": "Z.AI: GLM 4.5V", + "id": "openrouter/free", + "name": "Free Models Router", + "display_name": "Free Models Router", "modalities": { "input": [ "text", @@ -93595,10 +104707,9 @@ ] }, "limit": { - "context": 65536, - "output": 16384 + "context": 8192, + "output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -93607,33 +104718,32 @@ "type": "imageGeneration" }, { - "id": "z-ai/glm-4.6", - "name": "Z.AI: GLM 4.6", - "display_name": "Z.AI: GLM 4.6", + "id": "perplexity/sonar", + "name": "Perplexity: Sonar", + "display_name": "Perplexity: Sonar", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 202752, - "output": 65536 + "context": 127072, + "output": 127072 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "z-ai/glm-4.6:exacto", - "name": "Z.AI: GLM 4.6 (exacto)", - "display_name": "Z.AI: GLM 4.6 (exacto)", + "id": "perplexity/sonar-deep-research", + "name": "Perplexity: Sonar Deep Research", + "display_name": "Perplexity: Sonar Deep Research", "modalities": { "input": [ "text" @@ -93643,11 +104753,10 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 128000, + "output": 128000 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true @@ -93655,89 +104764,56 @@ "type": "chat" }, { - "id": "z-ai/glm-4.6v", - "name": "Z.AI: GLM 4.6V", - "display_name": "Z.AI: GLM 4.6V", + "id": "perplexity/sonar-pro", + "name": "Perplexity: Sonar Pro", + "display_name": "Perplexity: Sonar Pro", "modalities": { "input": [ - "image", "text", - "video" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 131072, - "output": 131072 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "type": "imageGeneration" - }, - { - "id": "z-ai/glm-4.7", - "name": "Z.AI: GLM 4.7", - "display_name": "Z.AI: GLM 4.7", - "modalities": { - "input": [ - "text" + "image" ], "output": [ "text" ] }, "limit": { - "context": 202752, - "output": 65535 + "context": 200000, + "output": 8000 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "type": "chat" - } - ] - }, - "jiekou": { - "id": "jiekou", - "name": "Jiekou", - "display_name": "Jiekou", - "models": [ + "type": "imageGeneration" + }, { - "id": "baichuan/baichuan-m2-32b", - "name": "BaiChuan M2 32B", - "display_name": "BaiChuan M2 32B", + "id": "perplexity/sonar-pro-search", + "name": "Perplexity: Sonar Pro Search", + "display_name": "Perplexity: Sonar Pro Search", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 200000, + "output": 8000 }, "tool_call": false, "reasoning": { "supported": true, "default": true }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "claude-3-5-haiku-20241022", - "name": "claude-3-5-haiku-20241022", - "display_name": "claude-3-5-haiku-20241022", + "id": "perplexity/sonar-reasoning-pro", + "name": "Perplexity: Sonar Reasoning Pro", + "display_name": "Perplexity: Sonar Reasoning Pro", "modalities": { "input": [ "text", @@ -93748,54 +104824,55 @@ ] }, "limit": { - "context": 200000, - "output": 8192 + "context": 128000, + "output": 128000 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "claude-3-5-sonnet-20241022", - "name": "claude-3-5-sonnet-20241022", - "display_name": "claude-3-5-sonnet-20241022", + "id": "prime-intellect/intellect-3", + "name": "Prime Intellect: INTELLECT-3", + "display_name": "Prime Intellect: INTELLECT-3", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 8192 + "context": 131072, + "output": 131072 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "type": "chat" }, { - "id": "claude-3-7-sonnet-20250219", - "name": "claude-3-7-sonnet-20250219", - "display_name": "claude-3-7-sonnet-20250219", + "id": "qwen/qwen-2.5-72b-instruct", + "name": "Qwen2.5 72B Instruct", + "display_name": "Qwen2.5 72B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 32768, + "output": 16384 }, "tool_call": true, "reasoning": { @@ -93804,21 +104881,20 @@ "type": "chat" }, { - "id": "claude-3-haiku-20240307", - "name": "claude-3-haiku-20240307", - "display_name": "claude-3-haiku-20240307", + "id": "qwen/qwen-2.5-7b-instruct", + "name": "Qwen: Qwen2.5 7B Instruct", + "display_name": "Qwen: Qwen2.5 7B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 4096 + "context": 32768, + "output": 32768 }, "tool_call": true, "reasoning": { @@ -93827,32 +104903,31 @@ "type": "chat" }, { - "id": "claude-haiku-4-5-20251001", - "name": "claude-haiku-4-5-20251001", - "display_name": "claude-haiku-4-5-20251001", + "id": "qwen/qwen-2.5-coder-32b-instruct", + "name": "Qwen2.5 Coder 32B Instruct", + "display_name": "Qwen2.5 Coder 32B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 20000, - "output": 20000 + "context": 32768, + "output": 32768 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "type": "chat" }, { - "id": "claude-opus-4-1-20250805", - "name": "claude-opus-4-1-20250805", - "display_name": "claude-opus-4-1-20250805", + "id": "qwen/qwen-2.5-vl-7b-instruct", + "name": "Qwen: Qwen2.5-VL 7B Instruct", + "display_name": "Qwen: Qwen2.5-VL 7B Instruct", "modalities": { "input": [ "text", @@ -93863,31 +104938,30 @@ ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 32768, + "output": 32768 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "claude-opus-4-20250514", - "name": "claude-opus-4-20250514", - "display_name": "claude-opus-4-20250514", + "id": "qwen/qwen-max", + "name": "Qwen: Qwen-Max", + "display_name": "Qwen: Qwen-Max", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 32768, + "output": 8192 }, "tool_call": true, "reasoning": { @@ -93896,21 +104970,20 @@ "type": "chat" }, { - "id": "claude-opus-4-5-20251101", - "name": "claude-opus-4-5-20251101", - "display_name": "claude-opus-4-5-20251101", + "id": "qwen/qwen-plus", + "name": "Qwen: Qwen-Plus", + "display_name": "Qwen: Qwen-Plus", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 65536 + "context": 131072, + "output": 8192 }, "tool_call": true, "reasoning": { @@ -93919,21 +104992,20 @@ "type": "chat" }, { - "id": "claude-opus-4-5-20251101-dd", - "name": "claude-opus-4-5-20251101-dd", - "display_name": "claude-opus-4-5-20251101-dd", + "id": "qwen/qwen-plus-2025-07-28", + "name": "Qwen: Qwen Plus 0728", + "display_name": "Qwen: Qwen Plus 0728", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 65536 + "context": 1000000, + "output": 32768 }, "tool_call": true, "reasoning": { @@ -93942,44 +105014,43 @@ "type": "chat" }, { - "id": "claude-sonnet-4-20250514", - "name": "claude-sonnet-4-20250514", - "display_name": "claude-sonnet-4-20250514", + "id": "qwen/qwen-plus-2025-07-28:thinking", + "name": "Qwen: Qwen Plus 0728 (thinking)", + "display_name": "Qwen: Qwen Plus 0728 (thinking)", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 1000000, + "output": 32768 }, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "type": "chat" }, { - "id": "claude-sonnet-4-20250514-dd", - "name": "claude-sonnet-4-20250514-dd", - "display_name": "claude-sonnet-4-20250514-dd", + "id": "qwen/qwen-turbo", + "name": "Qwen: Qwen-Turbo", + "display_name": "Qwen: Qwen-Turbo", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 1000000, + "output": 8192 }, "tool_call": true, "reasoning": { @@ -93988,9 +105059,9 @@ "type": "chat" }, { - "id": "claude-sonnet-4-5-20250929", - "name": "claude-sonnet-4-5-20250929", - "display_name": "claude-sonnet-4-5-20250929", + "id": "qwen/qwen-vl-max", + "name": "Qwen: Qwen VL Max", + "display_name": "Qwen: Qwen VL Max", "modalities": { "input": [ "text", @@ -94001,19 +105072,19 @@ ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 131072, + "output": 8192 }, "tool_call": true, "reasoning": { "supported": false }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "claude-sonnet-4-5-20250929-dd", - "name": "claude-sonnet-4-5-20250929-dd", - "display_name": "claude-sonnet-4-5-20250929-dd", + "id": "qwen/qwen-vl-plus", + "name": "Qwen: Qwen VL Plus", + "display_name": "Qwen: Qwen VL Plus", "modalities": { "input": [ "text", @@ -94024,19 +105095,19 @@ ] }, "limit": { - "context": 20000, - "output": 20000 + "context": 7500, + "output": 1500 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "deepseek/deepseek-r1-0528", - "name": "DeepSeek R1 0528", - "display_name": "DeepSeek R1 0528", + "id": "qwen/qwen2.5-coder-7b-instruct", + "name": "Qwen: Qwen2.5 Coder 7B Instruct", + "display_name": "Qwen: Qwen2.5 Coder 7B Instruct", "modalities": { "input": [ "text" @@ -94046,135 +105117,134 @@ ] }, "limit": { - "context": 163840, + "context": 32768, "output": 32768 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "type": "chat" }, { - "id": "deepseek/deepseek-v3-0324", - "name": "DeepSeek V3 0324", - "display_name": "DeepSeek V3 0324", + "id": "qwen/qwen2.5-vl-32b-instruct", + "name": "Qwen: Qwen2.5 VL 32B Instruct", + "display_name": "Qwen: Qwen2.5 VL 32B Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 163840, - "output": 163840 + "context": 16384, + "output": 16384 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "deepseek/deepseek-v3.1", - "name": "DeepSeek V3.1", - "display_name": "DeepSeek V3.1", + "id": "qwen/qwen2.5-vl-72b-instruct", + "name": "Qwen: Qwen2.5 VL 72B Instruct", + "display_name": "Qwen: Qwen2.5 VL 72B Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 163840, + "context": 32768, "output": 32768 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "doubao-1-5-pro-32k-250115", - "name": "doubao-1-5-pro-32k-250115", - "display_name": "doubao-1-5-pro-32k-250115", + "id": "qwen/qwen3-14b", + "name": "Qwen: Qwen3 14B", + "display_name": "Qwen: Qwen3 14B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 12000 + "context": 40960, + "output": 40960 }, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "type": "chat" }, { - "id": "doubao-1.5-pro-32k-character-250715", - "name": "doubao-1.5-pro-32k-character-250715", - "display_name": "doubao-1.5-pro-32k-character-250715", + "id": "qwen/qwen3-235b-a22b", + "name": "Qwen: Qwen3 235B A22B", + "display_name": "Qwen: Qwen3 235B A22B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 40960, + "output": 40960 }, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "type": "chat" }, { - "id": "doubao-seed-1-8-251228", - "name": "doubao-seed-1-8-251228", - "display_name": "doubao-seed-1-8-251228", + "id": "qwen/qwen3-235b-a22b-2507", + "name": "Qwen: Qwen3 235B A22B Instruct 2507", + "display_name": "Qwen: Qwen3 235B A22B Instruct 2507", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 64000 + "context": 262144, + "output": 262144 }, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "type": "chat" }, { - "id": "baidu/ernie-4.5-300b-a47b-paddle", - "name": "ERNIE 4.5 300B A47B", - "display_name": "ERNIE 4.5 300B A47B", + "id": "qwen/qwen3-235b-a22b-thinking-2507", + "name": "Qwen: Qwen3 235B A22B Thinking 2507", + "display_name": "Qwen: Qwen3 235B A22B Thinking 2507", "modalities": { "input": [ "text" @@ -94184,31 +105254,31 @@ ] }, "limit": { - "context": 123000, - "output": 12000 + "context": 262144, + "output": 262144 }, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "type": "chat" }, { - "id": "baidu/ernie-4.5-vl-424b-a47b", - "name": "ERNIE 4.5 VL 424B A47B", - "display_name": "ERNIE 4.5 VL 424B A47B", + "id": "qwen/qwen3-30b-a3b", + "name": "Qwen: Qwen3 30B A3B", + "display_name": "Qwen: Qwen3 30B A3B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 123000, - "output": 16000 + "context": 40960, + "output": 40960 }, "tool_call": true, "reasoning": { @@ -94218,23 +105288,20 @@ "type": "chat" }, { - "id": "gemini-2.0-flash-20250609", - "name": "gemini-2.0-flash-20250609", - "display_name": "gemini-2.0-flash-20250609", + "id": "qwen/qwen3-30b-a3b-instruct-2507", + "name": "Qwen: Qwen3 30B A3B Instruct 2507", + "display_name": "Qwen: Qwen3 30B A3B Instruct 2507", "modalities": { "input": [ - "text", - "image", - "video", - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 200000 + "context": 262144, + "output": 262144 }, "tool_call": true, "reasoning": { @@ -94243,123 +105310,112 @@ "type": "chat" }, { - "id": "gemini-2.0-flash-lite", - "name": "gemini-2.0-flash-lite", - "display_name": "gemini-2.0-flash-lite", + "id": "qwen/qwen3-30b-a3b-thinking-2507", + "name": "Qwen: Qwen3 30B A3B Thinking 2507", + "display_name": "Qwen: Qwen3 30B A3B Thinking 2507", "modalities": { "input": [ - "text", - "image", - "video", - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65535 + "context": 32768, + "output": 32768 }, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "type": "chat" }, { - "id": "gemini-2.5-flash", - "name": "gemini-2.5-flash", - "display_name": "gemini-2.5-flash", + "id": "qwen/qwen3-32b", + "name": "Qwen: Qwen3 32B", + "display_name": "Qwen: Qwen3 32B", "modalities": { "input": [ - "text", - "image", - "video", - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65535 + "context": 40960, + "output": 40960 }, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "type": "chat" }, { - "id": "gemini-2.5-flash-lite", - "name": "gemini-2.5-flash-lite", - "display_name": "gemini-2.5-flash-lite", + "id": "qwen/qwen3-4b:free", + "name": "Qwen: Qwen3 4B (free)", + "display_name": "Qwen: Qwen3 4B (free)", "modalities": { "input": [ - "text", - "image", - "video", - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65535 + "context": 40960, + "output": 40960 }, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "type": "chat" }, { - "id": "gemini-2.5-flash-lite-preview-06-17", - "name": "gemini-2.5-flash-lite-preview-06-17", - "display_name": "gemini-2.5-flash-lite-preview-06-17", + "id": "qwen/qwen3-8b", + "name": "Qwen: Qwen3 8B", + "display_name": "Qwen: Qwen3 8B", "modalities": { "input": [ - "text", - "video", - "image", - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65535 + "context": 32000, + "output": 8192 }, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "type": "chat" }, { - "id": "gemini-2.5-flash-lite-preview-09-2025", - "name": "gemini-2.5-flash-lite-preview-09-2025", - "display_name": "gemini-2.5-flash-lite-preview-09-2025", + "id": "qwen/qwen3-coder", + "name": "Qwen: Qwen3 Coder 480B A35B", + "display_name": "Qwen: Qwen3 Coder 480B A35B", "modalities": { "input": [ - "text", - "image", - "video", - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 262144, + "output": 262144 }, "tool_call": true, "reasoning": { @@ -94369,23 +105425,20 @@ "type": "chat" }, { - "id": "gemini-2.5-flash-preview-05-20", - "name": "gemini-2.5-flash-preview-05-20", - "display_name": "gemini-2.5-flash-preview-05-20", + "id": "qwen/qwen3-coder-30b-a3b-instruct", + "name": "Qwen: Qwen3 Coder 30B A3B Instruct", + "display_name": "Qwen: Qwen3 Coder 30B A3B Instruct", "modalities": { "input": [ - "text", - "image", - "video", - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 200000 + "context": 160000, + "output": 32768 }, "tool_call": true, "reasoning": { @@ -94394,23 +105447,20 @@ "type": "chat" }, { - "id": "gemini-2.5-pro", - "name": "gemini-2.5-pro", - "display_name": "gemini-2.5-pro", + "id": "qwen/qwen3-coder-flash", + "name": "Qwen: Qwen3 Coder Flash", + "display_name": "Qwen: Qwen3 Coder Flash", "modalities": { "input": [ - "text", - "image", - "video", - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65535 + "context": 128000, + "output": 65536 }, "tool_call": true, "reasoning": { @@ -94419,24 +105469,22 @@ "type": "chat" }, { - "id": "gemini-2.5-pro-preview-06-05", - "name": "gemini-2.5-pro-preview-06-05", - "display_name": "gemini-2.5-pro-preview-06-05", + "id": "qwen/qwen3-coder-next", + "name": "Qwen: Qwen3 Coder Next", + "display_name": "Qwen: Qwen3 Coder Next", "modalities": { "input": [ - "text", - "image", - "video", - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 200000 + "context": 262144, + "output": 65536 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false @@ -94444,22 +105492,19 @@ "type": "chat" }, { - "id": "gemini-3-flash-preview", - "name": "gemini-3-flash-preview", - "display_name": "gemini-3-flash-preview", + "id": "qwen/qwen3-coder-plus", + "name": "Qwen: Qwen3 Coder Plus", + "display_name": "Qwen: Qwen3 Coder Plus", "modalities": { "input": [ - "text", - "image", - "video", - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, + "context": 128000, "output": 65536 }, "tool_call": true, @@ -94469,22 +105514,19 @@ "type": "chat" }, { - "id": "gemini-3-pro-preview", - "name": "gemini-3-pro-preview", - "display_name": "gemini-3-pro-preview", + "id": "qwen/qwen3-coder:exacto", + "name": "Qwen: Qwen3 Coder 480B A35B (exacto)", + "display_name": "Qwen: Qwen3 Coder 480B A35B (exacto)", "modalities": { "input": [ - "text", - "image", - "video", - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, + "context": 262144, "output": 65536 }, "tool_call": true, @@ -94494,104 +105536,98 @@ "type": "chat" }, { - "id": "google/gemma-3-27b-it", - "name": "Gemma 3 27B", - "display_name": "Gemma 3 27B", + "id": "qwen/qwen3-coder:free", + "name": "Qwen: Qwen3 Coder 480B A35B (free)", + "display_name": "Qwen: Qwen3 Coder 480B A35B (free)", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 262000, + "output": 262000 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "type": "chat" }, { - "id": "google/gemma-3-12b-it", - "name": "Gemma3 12B", - "display_name": "Gemma3 12B", + "id": "qwen/qwen3-max", + "name": "Qwen: Qwen3 Max", + "display_name": "Qwen: Qwen3 Max", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 256000, + "output": 32768 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "type": "chat" }, { - "id": "thudm/glm-4.1v-9b-thinking", - "name": "GLM 4.1V 9B Thinking", - "display_name": "GLM 4.1V 9B Thinking", + "id": "qwen/qwen3-next-80b-a3b-instruct", + "name": "Qwen: Qwen3 Next 80B A3B Instruct", + "display_name": "Qwen: Qwen3 Next 80B A3B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 65536, - "output": 8000 + "context": 262144, + "output": 262144 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "type": "chat" }, { - "id": "zai-org/glm-4.5v", - "name": "GLM 4.5V", - "display_name": "GLM 4.5V", + "id": "qwen/qwen3-next-80b-a3b-instruct:free", + "name": "Qwen: Qwen3 Next 80B A3B Instruct (free)", + "display_name": "Qwen: Qwen3 Next 80B A3B Instruct (free)", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 65536, - "output": 16384 + "context": 262144, + "output": 262144 }, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "type": "chat" }, { - "id": "zai-org/glm-4.5", - "name": "GLM-4.5", - "display_name": "GLM-4.5", + "id": "qwen/qwen3-next-80b-a3b-thinking", + "name": "Qwen: Qwen3 Next 80B A3B Thinking", + "display_name": "Qwen: Qwen3 Next 80B A3B Thinking", "modalities": { "input": [ "text" @@ -94601,8 +105637,8 @@ ] }, "limit": { - "context": 131072, - "output": 98304 + "context": 128000, + "output": 128000 }, "tool_call": true, "reasoning": { @@ -94612,32 +105648,33 @@ "type": "chat" }, { - "id": "zai-org/glm-4.7", - "name": "GLM-4.7", - "display_name": "GLM-4.7", + "id": "qwen/qwen3-vl-235b-a22b-instruct", + "name": "Qwen: Qwen3 VL 235B A22B Instruct", + "display_name": "Qwen: Qwen3 VL 235B A22B Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 262144, + "output": 262144 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "gpt-4.1", - "name": "gpt-4.1", - "display_name": "gpt-4.1", + "id": "qwen/qwen3-vl-235b-a22b-thinking", + "name": "Qwen: Qwen3 VL 235B A22B Thinking", + "display_name": "Qwen: Qwen3 VL 235B A22B Thinking", "modalities": { "input": [ "text", @@ -94648,19 +105685,21 @@ ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 262144, + "output": 262144 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "gpt-4.1-mini", - "name": "gpt-4.1-mini", - "display_name": "gpt-4.1-mini", + "id": "qwen/qwen3-vl-30b-a3b-instruct", + "name": "Qwen: Qwen3 VL 30B A3B Instruct", + "display_name": "Qwen: Qwen3 VL 30B A3B Instruct", "modalities": { "input": [ "text", @@ -94671,19 +105710,20 @@ ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 262144, + "output": 262144 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "gpt-4.1-nano", - "name": "gpt-4.1-nano", - "display_name": "gpt-4.1-nano", + "id": "qwen/qwen3-vl-30b-a3b-thinking", + "name": "Qwen: Qwen3 VL 30B A3B Thinking", + "display_name": "Qwen: Qwen3 VL 30B A3B Thinking", "modalities": { "input": [ "text", @@ -94694,19 +105734,21 @@ ] }, "limit": { - "context": 1047576, + "context": 131072, "output": 32768 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "gpt-4o", - "name": "gpt-4o", - "display_name": "gpt-4o", + "id": "qwen/qwen3-vl-32b-instruct", + "name": "Qwen: Qwen3 VL 32B Instruct", + "display_name": "Qwen: Qwen3 VL 32B Instruct", "modalities": { "input": [ "text", @@ -94717,23 +105759,23 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 262144, + "output": 262144 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "gpt-4o-mini", - "name": "gpt-4o-mini", - "display_name": "gpt-4o-mini", + "id": "qwen/qwen3-vl-8b-instruct", + "name": "Qwen: Qwen3 VL 8B Instruct", + "display_name": "Qwen: Qwen3 VL 8B Instruct", "modalities": { "input": [ - "text", - "image" + "image", + "text" ], "output": [ "text" @@ -94741,123 +105783,121 @@ }, "limit": { "context": 131072, - "output": 131072 + "output": 32768 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "gpt-5", - "name": "gpt-5", - "display_name": "gpt-5", + "id": "qwen/qwen3-vl-8b-thinking", + "name": "Qwen: Qwen3 VL 8B Thinking", + "display_name": "Qwen: Qwen3 VL 8B Thinking", "modalities": { "input": [ - "text", - "image" + "image", + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 256000, + "output": 32768 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "gpt-5-chat-latest", - "name": "gpt-5-chat-latest", - "display_name": "gpt-5-chat-latest", + "id": "qwen/qwq-32b", + "name": "Qwen: QwQ 32B", + "display_name": "Qwen: QwQ 32B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 32768, + "output": 32768 }, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "type": "chat" }, { - "id": "gpt-5-codex", - "name": "gpt-5-codex", - "display_name": "gpt-5-codex", + "id": "raifle/sorcererlm-8x22b", + "name": "SorcererLM 8x22B", + "display_name": "SorcererLM 8x22B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 16000, + "output": 16000 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "type": "chat" }, { - "id": "gpt-5-mini", - "name": "gpt-5-mini", - "display_name": "gpt-5-mini", + "id": "relace/relace-apply-3", + "name": "Relace: Relace Apply 3", + "display_name": "Relace: Relace Apply 3", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, + "context": 256000, "output": 128000 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "type": "chat" }, { - "id": "gpt-5-nano", - "name": "gpt-5-nano", - "display_name": "gpt-5-nano", + "id": "relace/relace-search", + "name": "Relace: Relace Search", + "display_name": "Relace: Relace Search", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, + "context": 256000, "output": 128000 }, "tool_call": true, @@ -94867,213 +105907,202 @@ "type": "chat" }, { - "id": "gpt-5-pro", - "name": "gpt-5-pro", - "display_name": "gpt-5-pro", + "id": "sao10k/l3-euryale-70b", + "name": "Sao10k: Llama 3 Euryale 70B v2.1", + "display_name": "Sao10k: Llama 3 Euryale 70B v2.1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 272000 + "context": 8192, + "output": 8192 }, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "type": "chat" }, { - "id": "gpt-5.1", - "name": "gpt-5.1", - "display_name": "gpt-5.1", + "id": "sao10k/l3-lunaris-8b", + "name": "Sao10K: Llama 3 8B Lunaris", + "display_name": "Sao10K: Llama 3 8B Lunaris", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 8192, + "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "type": "chat" }, { - "id": "gpt-5.1-chat-latest", - "name": "gpt-5.1-chat-latest", - "display_name": "gpt-5.1-chat-latest", + "id": "sao10k/l3.1-70b-hanami-x1", + "name": "Sao10K: Llama 3.1 70B Hanami x1", + "display_name": "Sao10K: Llama 3.1 70B Hanami x1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 16000, "output": 16000 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "type": "chat" }, { - "id": "gpt-5.1-codex", - "name": "gpt-5.1-codex", - "display_name": "gpt-5.1-codex", + "id": "sao10k/l3.1-euryale-70b", + "name": "Sao10K: Llama 3.1 Euryale 70B v2.2", + "display_name": "Sao10K: Llama 3.1 Euryale 70B v2.2", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 32768, + "output": 32768 }, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "type": "chat" }, { - "id": "gpt-5.1-codex-max", - "name": "gpt-5.1-codex-max", - "display_name": "gpt-5.1-codex-max", + "id": "sao10k/l3.3-euryale-70b", + "name": "Sao10K: Llama 3.3 Euryale 70B", + "display_name": "Sao10K: Llama 3.3 Euryale 70B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 131072, + "output": 16384 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "type": "chat" }, { - "id": "gpt-5.1-codex-mini", - "name": "gpt-5.1-codex-mini", - "display_name": "gpt-5.1-codex-mini", + "id": "stepfun-ai/step3", + "name": "StepFun: Step3", + "display_name": "StepFun: Step3", "modalities": { "input": [ - "text", - "image" + "image", + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 65536, + "output": 65536 }, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "gpt-5.2", - "name": "gpt-5.2", - "display_name": "gpt-5.2", + "id": "stepfun/step-3.5-flash:free", + "name": "StepFun: Step 3.5 Flash (free)", + "display_name": "StepFun: Step 3.5 Flash (free)", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 256000, + "output": 256000 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "type": "chat" }, { - "id": "gpt-5.2-chat-latest", - "name": "gpt-5.2-chat-latest", - "display_name": "gpt-5.2-chat-latest", + "id": "switchpoint/router", + "name": "Switchpoint Router", + "display_name": "Switchpoint Router", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16000 + "context": 131072, + "output": 131072 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "type": "chat" }, { - "id": "gpt-5.2-pro", - "name": "gpt-5.2-pro", - "display_name": "gpt-5.2-pro", + "id": "tencent/hunyuan-a13b-instruct", + "name": "Tencent: Hunyuan A13B Instruct", + "display_name": "Tencent: Hunyuan A13B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 131072, + "output": 131072 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true @@ -95081,13 +106110,12 @@ "type": "chat" }, { - "id": "grok-3", - "name": "grok-3", - "display_name": "grok-3", + "id": "thedrummer/cydonia-24b-v4.1", + "name": "TheDrummer: Cydonia 24B V4.1", + "display_name": "TheDrummer: Cydonia 24B V4.1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -95095,30 +106123,29 @@ }, "limit": { "context": 131072, - "output": 32000 + "output": 131072 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "type": "chat" }, { - "id": "grok-3-mini", - "name": "grok-3-mini", - "display_name": "grok-3-mini", + "id": "thedrummer/rocinante-12b", + "name": "TheDrummer: Rocinante 12B", + "display_name": "TheDrummer: Rocinante 12B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 32768, + "output": 32768 }, "tool_call": true, "reasoning": { @@ -95127,44 +106154,42 @@ "type": "chat" }, { - "id": "grok-4-0709", - "name": "grok-4-0709", - "display_name": "grok-4-0709", + "id": "thedrummer/skyfall-36b-v2", + "name": "TheDrummer: Skyfall 36B V2", + "display_name": "TheDrummer: Skyfall 36B V2", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 8192 + "context": 32768, + "output": 32768 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "type": "chat" }, { - "id": "grok-4-1-fast-non-reasoning", - "name": "grok-4-1-fast-non-reasoning", - "display_name": "grok-4-1-fast-non-reasoning", + "id": "thedrummer/unslopnemo-12b", + "name": "TheDrummer: UnslopNemo 12B", + "display_name": "TheDrummer: UnslopNemo 12B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 2000000 + "context": 32768, + "output": 32768 }, "tool_call": true, "reasoning": { @@ -95173,101 +106198,101 @@ "type": "chat" }, { - "id": "grok-4-1-fast-reasoning", - "name": "grok-4-1-fast-reasoning", - "display_name": "grok-4-1-fast-reasoning", + "id": "tngtech/deepseek-r1t-chimera", + "name": "TNG: DeepSeek R1T Chimera", + "display_name": "TNG: DeepSeek R1T Chimera", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 2000000 + "context": 163840, + "output": 163840 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "type": "chat" }, { - "id": "grok-4-fast-non-reasoning", - "name": "grok-4-fast-non-reasoning", - "display_name": "grok-4-fast-non-reasoning", + "id": "tngtech/deepseek-r1t-chimera:free", + "name": "TNG: DeepSeek R1T Chimera (free)", + "display_name": "TNG: DeepSeek R1T Chimera (free)", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 2000000 + "context": 163840, + "output": 163840 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "type": "chat" }, { - "id": "grok-4-fast-reasoning", - "name": "grok-4-fast-reasoning", - "display_name": "grok-4-fast-reasoning", + "id": "tngtech/deepseek-r1t2-chimera", + "name": "TNG: DeepSeek R1T2 Chimera", + "display_name": "TNG: DeepSeek R1T2 Chimera", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 2000000 + "context": 163840, + "output": 163840 }, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "type": "chat" }, { - "id": "grok-code-fast-1", - "name": "grok-code-fast-1", - "display_name": "grok-code-fast-1", + "id": "tngtech/deepseek-r1t2-chimera:free", + "name": "TNG: DeepSeek R1T2 Chimera (free)", + "display_name": "TNG: DeepSeek R1T2 Chimera (free)", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 163840, + "output": 163840 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "type": "chat" }, { - "id": "moonshotai/kimi-k2-0905", - "name": "Kimi K2 0905", - "display_name": "Kimi K2 0905", + "id": "tngtech/tng-r1t-chimera", + "name": "TNG: R1T Chimera", + "display_name": "TNG: R1T Chimera", "modalities": { "input": [ "text" @@ -95277,19 +106302,20 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 163840, + "output": 65536 }, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "type": "chat" }, { - "id": "moonshotai/kimi-k2-instruct", - "name": "Kimi K2 Instruct", - "display_name": "Kimi K2 Instruct", + "id": "tngtech/tng-r1t-chimera:free", + "name": "TNG: R1T Chimera (free)", + "display_name": "TNG: R1T Chimera (free)", "modalities": { "input": [ "text" @@ -95299,19 +106325,20 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 163840, + "output": 65536 }, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "type": "chat" }, { - "id": "sao10k/l3-70b-euryale-v2.1", - "name": "L3 70B Euryale V2.1", - "display_name": "L3 70B Euryale V2.1", + "id": "undi95/remm-slerp-l2-13b", + "name": "ReMM SLERP 13B", + "display_name": "ReMM SLERP 13B", "modalities": { "input": [ "text" @@ -95321,19 +106348,19 @@ ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 6144, + "output": 4096 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "type": "chat" }, { - "id": "Sao10K/L3-8B-Stheno-v3.2", - "name": "L3 8B Stheno V3.2", - "display_name": "L3 8B Stheno V3.2", + "id": "upstage/solar-pro-3:free", + "name": "Upstage: Solar Pro 3 (free)", + "display_name": "Upstage: Solar Pro 3 (free)", "modalities": { "input": [ "text" @@ -95343,19 +106370,20 @@ ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 128000, + "output": 128000 }, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "type": "chat" }, { - "id": "sao10k/l31-70b-euryale-v2.2", - "name": "L31 70B Euryale V2.2", - "display_name": "L31 70B Euryale V2.2", + "id": "writer/palmyra-x5", + "name": "Writer: Palmyra X5", + "display_name": "Writer: Palmyra X5", "modalities": { "input": [ "text" @@ -95365,19 +106393,19 @@ ] }, "limit": { - "context": 8192, + "context": 1040000, "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "type": "chat" }, { - "id": "meta-llama/llama-3.1-8b-instruct", - "name": "Llama 3.1 8B Instruct", - "display_name": "Llama 3.1 8B Instruct", + "id": "x-ai/grok-3", + "name": "xAI: Grok 3", + "display_name": "xAI: Grok 3", "modalities": { "input": [ "text" @@ -95387,19 +106415,19 @@ ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 131072, + "output": 131072 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "type": "chat" }, { - "id": "meta-llama/llama-3.2-3b-instruct", - "name": "Llama 3.2 3B Instruct", - "display_name": "Llama 3.2 3B Instruct", + "id": "x-ai/grok-3-beta", + "name": "xAI: Grok 3 Beta", + "display_name": "xAI: Grok 3 Beta", "modalities": { "input": [ "text" @@ -95409,8 +106437,8 @@ ] }, "limit": { - "context": 32768, - "output": 32000 + "context": 131072, + "output": 131072 }, "tool_call": true, "reasoning": { @@ -95419,9 +106447,9 @@ "type": "chat" }, { - "id": "meta-llama/llama-3.3-70b-instruct", - "name": "Llama 3.3 70B Instruct", - "display_name": "Llama 3.3 70B Instruct", + "id": "x-ai/grok-3-mini", + "name": "xAI: Grok 3 Mini", + "display_name": "xAI: Grok 3 Mini", "modalities": { "input": [ "text" @@ -95432,110 +106460,115 @@ }, "limit": { "context": 131072, - "output": 120000 + "output": 131072 }, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "type": "chat" }, { - "id": "meta-llama/llama-4-maverick-17b-128e-instruct-fp8", - "name": "Llama 4 Maverick Instruct", - "display_name": "Llama 4 Maverick Instruct", + "id": "x-ai/grok-3-mini-beta", + "name": "xAI: Grok 3 Mini Beta", + "display_name": "xAI: Grok 3 Mini Beta", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 1048576 + "context": 131072, + "output": 131072 }, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "type": "chat" }, { - "id": "meta-llama/llama-4-scout-17b-16e-instruct", - "name": "Llama 4 Scout Instruct", - "display_name": "Llama 4 Scout Instruct", + "id": "x-ai/grok-4", + "name": "xAI: Grok 4", + "display_name": "xAI: Grok 4", "modalities": { "input": [ - "text", - "image" + "image", + "text" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 256000, + "output": 256000 }, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "minimaxai/minimax-m1-80k", - "name": "MiniMax M1", - "display_name": "MiniMax M1", + "id": "x-ai/grok-4-fast", + "name": "xAI: Grok 4 Fast", + "display_name": "xAI: Grok 4 Fast", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 40000 + "context": 2000000, + "output": 30000 }, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "minimax/minimax-m2.1", - "name": "Minimax M2.1", - "display_name": "Minimax M2.1", + "id": "x-ai/grok-4.1-fast", + "name": "xAI: Grok 4.1 Fast", + "display_name": "xAI: Grok 4.1 Fast", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 2000000, + "output": 30000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "mistralai/mistral-7b-instruct", - "name": "Mistral 7B Instruct", - "display_name": "Mistral 7B Instruct", + "id": "x-ai/grok-code-fast-1", + "name": "xAI: Grok Code Fast 1", + "display_name": "xAI: Grok Code Fast 1", "modalities": { "input": [ "text" @@ -95545,19 +106578,20 @@ ] }, "limit": { - "context": 32768, - "output": 8192 + "context": 256000, + "output": 10000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "type": "chat" }, { - "id": "mistralai/mistral-nemo", - "name": "Mistral Nemo", - "display_name": "Mistral Nemo", + "id": "xiaomi/mimo-v2-flash", + "name": "Xiaomi: MiMo-V2-Flash", + "display_name": "Xiaomi: MiMo-V2-Flash", "modalities": { "input": [ "text" @@ -95567,19 +106601,20 @@ ] }, "limit": { - "context": 60288, - "output": 32000 + "context": 262144, + "output": 262144 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "type": "chat" }, { - "id": "gryphe/mythomax-l2-13b", - "name": "Mythomax L2 13B", - "display_name": "Mythomax L2 13B", + "id": "z-ai/glm-4-32b", + "name": "Z.AI: GLM 4 32B", + "display_name": "Z.AI: GLM 4 32B", "modalities": { "input": [ "text" @@ -95589,46 +106624,47 @@ ] }, "limit": { - "context": 4096, - "output": 4096 + "context": 128000, + "output": 128000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "type": "chat" }, { - "id": "nova-2-Lite", - "name": "nova-2-Lite", - "display_name": "nova-2-Lite", + "id": "z-ai/glm-4.5", + "name": "Z.AI: GLM 4.5", + "display_name": "Z.AI: GLM 4.5", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 1000000 + "context": 131072, + "output": 65536 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "type": "chat" }, { - "id": "o1", - "name": "o1", - "display_name": "o1", + "id": "z-ai/glm-4.5-air", + "name": "Z.AI: GLM 4.5 Air", + "display_name": "Z.AI: GLM 4.5 Air", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -95638,20 +106674,21 @@ "context": 131072, "output": 131072 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "type": "chat" }, { - "id": "o1-mini", - "name": "o1-mini", - "display_name": "o1-mini", + "id": "z-ai/glm-4.5-air:free", + "name": "Z.AI: GLM 4.5 Air (free)", + "display_name": "Z.AI: GLM 4.5 Air (free)", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -95659,18 +106696,20 @@ }, "limit": { "context": 131072, - "output": 131072 + "output": 96000 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "type": "chat" }, { - "id": "o3", - "name": "o3", - "display_name": "o3", + "id": "z-ai/glm-4.5v", + "name": "Z.AI: GLM 4.5V", + "display_name": "Z.AI: GLM 4.5V", "modalities": { "input": [ "text", @@ -95681,55 +106720,58 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 65536, + "output": 16384 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "o3-mini", - "name": "o3-mini", - "display_name": "o3-mini", + "id": "z-ai/glm-4.6", + "name": "Z.AI: GLM 4.6", + "display_name": "Z.AI: GLM 4.6", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 202752, + "output": 65536 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "type": "chat" }, { - "id": "openai/gpt-oss-120b", - "name": "OpenAI GPT OSS 120B", - "display_name": "OpenAI GPT OSS 120B", + "id": "z-ai/glm-4.6:exacto", + "name": "Z.AI: GLM 4.6 (exacto)", + "display_name": "Z.AI: GLM 4.6 (exacto)", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 131072, + "context": 204800, "output": 131072 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -95738,13 +106780,14 @@ "type": "chat" }, { - "id": "openai/gpt-oss-20b", - "name": "OpenAI: GPT OSS 20B", - "display_name": "OpenAI: GPT OSS 20B", + "id": "z-ai/glm-4.6v", + "name": "Z.AI: GLM 4.6V", + "display_name": "Z.AI: GLM 4.6V", "modalities": { "input": [ + "image", "text", - "image" + "video" ], "output": [ "text" @@ -95752,19 +106795,20 @@ }, "limit": { "context": 131072, - "output": 32768 + "output": 131072 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "qwen/qwen-2.5-72b-instruct", - "name": "Qwen 2.5 72B Instruct", - "display_name": "Qwen 2.5 72B Instruct", + "id": "z-ai/glm-4.7", + "name": "Z.AI: GLM 4.7", + "display_name": "Z.AI: GLM 4.7", "modalities": { "input": [ "text" @@ -95774,19 +106818,21 @@ ] }, "limit": { - "context": 32000, - "output": 8192 + "context": 202752, + "output": 65535 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "type": "chat" }, { - "id": "qwen/qwen-mt-plus", - "name": "Qwen MT Plus", - "display_name": "Qwen MT Plus", + "id": "z-ai/glm-4.7-flash", + "name": "Z.AI: GLM 4.7 Flash", + "display_name": "Z.AI: GLM 4.7 Flash", "modalities": { "input": [ "text" @@ -95796,30 +106842,40 @@ ] }, "limit": { - "context": 4096, - "output": 2048 + "context": 200000, + "output": 131072 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "type": "chat" - }, + } + ] + }, + "jiekou": { + "id": "jiekou", + "name": "Jiekou", + "display_name": "Jiekou", + "models": [ { - "id": "qwen/qwen2.5-7b-instruct", - "name": "Qwen2.5 7B Instruct", - "display_name": "Qwen2.5 7B Instruct", + "id": "claude-3-5-haiku-20241022", + "name": "claude-3-5-haiku-20241022", + "display_name": "claude-3-5-haiku-20241022", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32000, - "output": 32000 + "context": 200000, + "output": 8192 }, "tool_call": true, "reasoning": { @@ -95828,67 +106884,67 @@ "type": "chat" }, { - "id": "qwen/qwen2.5-vl-72b-instruct", - "name": "Qwen2.5 VL 72B Instruct", - "display_name": "Qwen2.5 VL 72B Instruct", + "id": "claude-3-5-sonnet-20241022", + "name": "claude-3-5-sonnet-20241022", + "display_name": "claude-3-5-sonnet-20241022", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 200000, + "output": 8192 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "type": "chat" }, { - "id": "qwen/qwen3-235b-a22b-fp8", - "name": "Qwen3 235B A22B", - "display_name": "Qwen3 235B A22B", + "id": "claude-3-7-sonnet-20250219", + "name": "claude-3-7-sonnet-20250219", + "display_name": "claude-3-7-sonnet-20250219", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 40960, - "output": 20000 + "context": 200000, + "output": 64000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "type": "chat" }, { - "id": "qwen/qwen3-235b-a22b-instruct-2507", - "name": "Qwen3 235B A22B Instruct 2507", - "display_name": "Qwen3 235B A22B Instruct 2507", + "id": "claude-3-haiku-20240307", + "name": "claude-3-haiku-20240307", + "display_name": "claude-3-haiku-20240307", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 200000, + "output": 4096 }, "tool_call": true, "reasoning": { @@ -95897,112 +106953,113 @@ "type": "chat" }, { - "id": "qwen/qwen3-235b-a22b-thinking-2507", - "name": "Qwen3 235B A22b Thinking 2507", - "display_name": "Qwen3 235B A22b Thinking 2507", + "id": "claude-haiku-4-5-20251001", + "name": "claude-haiku-4-5-20251001", + "display_name": "claude-haiku-4-5-20251001", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 20000, + "output": 20000 }, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "type": "chat" }, { - "id": "qwen/qwen3-30b-a3b-fp8", - "name": "Qwen3 30B A3B", - "display_name": "Qwen3 30B A3B", + "id": "claude-opus-4-1-20250805", + "name": "claude-opus-4-1-20250805", + "display_name": "claude-opus-4-1-20250805", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 40960, - "output": 20000 + "context": 200000, + "output": 32000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "type": "chat" }, { - "id": "qwen/qwen3-32b-fp8", - "name": "Qwen3 32B", - "display_name": "Qwen3 32B", + "id": "claude-opus-4-20250514", + "name": "claude-opus-4-20250514", + "display_name": "claude-opus-4-20250514", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 40960, - "output": 20000 + "context": 200000, + "output": 32000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "type": "chat" }, { - "id": "qwen/qwen3-8b-fp8", - "name": "Qwen3 8B", - "display_name": "Qwen3 8B", + "id": "claude-opus-4-5-20251101", + "name": "claude-opus-4-5-20251101", + "display_name": "claude-opus-4-5-20251101", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 20000 + "context": 200000, + "output": 65536 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "type": "chat" }, { - "id": "qwen/qwen3-coder-480b-a35b-instruct", - "name": "Qwen3 Coder 480B A35B Instruct", - "display_name": "Qwen3 Coder 480B A35B Instruct", + "id": "claude-sonnet-4-20250514", + "name": "claude-sonnet-4-20250514", + "display_name": "claude-sonnet-4-20250514", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 200000, + "output": 64000 }, "tool_call": true, "reasoning": { @@ -96011,20 +107068,21 @@ "type": "chat" }, { - "id": "qwen/qwen3-next-80b-a3b-instruct", - "name": "Qwen3 Next 80B A3B Instruct", - "display_name": "Qwen3 Next 80B A3B Instruct", + "id": "claude-sonnet-4-5-20250929", + "name": "claude-sonnet-4-5-20250929", + "display_name": "claude-sonnet-4-5-20250929", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 65536, - "output": 65536 + "context": 200000, + "output": 64000 }, "tool_call": true, "reasoning": { @@ -96033,9 +107091,9 @@ "type": "chat" }, { - "id": "qwen/qwen3-next-80b-a3b-thinking", - "name": "Qwen3 Next 80B A3B Thinking", - "display_name": "Qwen3 Next 80B A3B Thinking", + "id": "deepseek/deepseek-r1-0528", + "name": "DeepSeek R1 0528", + "display_name": "DeepSeek R1 0528", "modalities": { "input": [ "text" @@ -96045,8 +107103,8 @@ ] }, "limit": { - "context": 65536, - "output": 65536 + "context": 163840, + "output": 32768 }, "tool_call": true, "reasoning": { @@ -96056,9 +107114,9 @@ "type": "chat" }, { - "id": "sao10k/l3-8b-lunaris", - "name": "Sao10k L3 8B Lunaris", - "display_name": "Sao10k L3 8B Lunaris", + "id": "deepseek/deepseek-v3-0324", + "name": "DeepSeek V3 0324", + "display_name": "DeepSeek V3 0324", "modalities": { "input": [ "text" @@ -96068,8 +107126,8 @@ ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 163840, + "output": 163840 }, "tool_call": true, "reasoning": { @@ -96078,9 +107136,9 @@ "type": "chat" }, { - "id": "xiaomimimo/mimo-v2-flash", - "name": "XiaomiMiMo/MiMo-V2-Flash", - "display_name": "XiaomiMiMo/MiMo-V2-Flash", + "id": "deepseek/deepseek-v3.1", + "name": "DeepSeek V3.1", + "display_name": "DeepSeek V3.1", "modalities": { "input": [ "text" @@ -96090,8 +107148,8 @@ ] }, "limit": { - "context": 262144, - "output": 131072 + "context": 163840, + "output": 32768 }, "tool_call": true, "reasoning": { @@ -96099,95 +107157,61 @@ "default": true }, "type": "chat" - } - ] - }, - "zenmux": { - "id": "zenmux", - "name": "ZenMux", - "display_name": "ZenMux", - "models": [ + }, { - "id": "anthropic/claude-3.5-haiku", - "name": "Anthropic: Claude 3.5 Haiku", - "display_name": "Anthropic: Claude 3.5 Haiku", + "id": "deepseek/deepseek-ocr-2", + "name": "DeepSeek-OCR 2", + "display_name": "DeepSeek-OCR 2", "modalities": { "input": [ - "text", - "image", - "pdf" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, + "context": 8192, "output": 8192 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-07-31", - "release_date": "2024-10-22", - "last_updated": "2024-10-22", - "cost": { - "input": 0.8, - "output": 4, - "cache_read": 0.08, - "cache_write": 1 - }, "type": "chat" }, { - "id": "anthropic/claude-3.5-sonnet", - "name": "Anthropic: Claude 3.5 Sonnet (Retiring Soon)", - "display_name": "Anthropic: Claude 3.5 Sonnet (Retiring Soon)", + "id": "doubao-1-5-pro-32k-250115", + "name": "doubao-1-5-pro-32k-250115", + "display_name": "doubao-1-5-pro-32k-250115", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 8192 + "context": 128000, + "output": 12000 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-04-30", - "release_date": "2024-10-22", - "last_updated": "2024-10-22", - "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 - }, "type": "chat" }, { - "id": "anthropic/claude-3.7-sonnet", - "name": "Anthropic: Claude 3.7 Sonnet", - "display_name": "Anthropic: Claude 3.7 Sonnet", + "id": "doubao-1.5-pro-32k-character-250715", + "name": "doubao-1.5-pro-32k-character-250715", + "display_name": "doubao-1.5-pro-32k-character-250715", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" @@ -96197,498 +107221,343 @@ "context": 200000, "output": 64000 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-10-31", - "release_date": "2025-02-19", - "last_updated": "2025-02-19", - "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "supported": false }, "type": "chat" }, { - "id": "anthropic/claude-haiku-4.5", - "name": "Anthropic: Claude Haiku 4.5", - "display_name": "Anthropic: Claude Haiku 4.5", + "id": "doubao-seed-1-8-251228", + "name": "doubao-seed-1-8-251228", + "display_name": "doubao-seed-1-8-251228", "modalities": { "input": [ "text", "image", - "pdf" + "video" ], "output": [ "text" ] }, "limit": { - "context": 200000, + "context": 256000, "output": 64000 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-02-28", - "release_date": "2025-10-15", - "last_updated": "2025-10-15", - "cost": { - "input": 1, - "output": 1.25, - "cache_read": 0.1, - "cache_write": 1.25 + "supported": false }, "type": "chat" }, { - "id": "anthropic/claude-opus-4", - "name": "Anthropic: Claude Opus 4", - "display_name": "Anthropic: Claude Opus 4", + "id": "baidu/ernie-4.5-300b-a47b-paddle", + "name": "ERNIE 4.5 300B A47B", + "display_name": "ERNIE 4.5 300B A47B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 123000, + "output": 12000 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", - "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "supported": false }, "type": "chat" }, { - "id": "anthropic/claude-opus-4.1", - "name": "Anthropic: Claude Opus 4.1", - "display_name": "Anthropic: Claude Opus 4.1", + "id": "baidu/ernie-4.5-vl-424b-a47b", + "name": "ERNIE 4.5 VL 424B A47B", + "display_name": "ERNIE 4.5 VL 424B A47B", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 123000, + "output": 16000 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-08-05", - "last_updated": "2025-08-05", - "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 - }, "type": "chat" }, { - "id": "anthropic/claude-opus-4.5", - "name": "Anthropic: Claude Opus 4.5", - "display_name": "Anthropic: Claude Opus 4.5", + "id": "gemini-2.0-flash-20250609", + "name": "gemini-2.0-flash-20250609", + "display_name": "gemini-2.0-flash-20250609", "modalities": { "input": [ "text", "image", - "pdf" + "video", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 1048576, + "output": 200000 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-11-24", - "last_updated": "2025-11-24", - "cost": { - "input": 5, - "output": 25, - "cache_read": 1.5, - "cache_write": 18.75 + "supported": false }, "type": "chat" }, { - "id": "anthropic/claude-sonnet-4", - "name": "Anthropic: Claude Sonnet 4", - "display_name": "Anthropic: Claude Sonnet 4", + "id": "gemini-2.0-flash-lite", + "name": "gemini-2.0-flash-lite", + "display_name": "gemini-2.0-flash-lite", "modalities": { "input": [ "text", "image", - "pdf" + "video", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 1048576, + "output": 65535 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", - "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "supported": false }, "type": "chat" }, { - "id": "anthropic/claude-sonnet-4.5", - "name": "Anthropic: Claude Sonnet 4.5", - "display_name": "Anthropic: Claude Sonnet 4.5", + "id": "gemini-2.5-flash", + "name": "gemini-2.5-flash", + "display_name": "gemini-2.5-flash", "modalities": { "input": [ "text", - "image" + "image", + "video", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 1048576, + "output": 65535 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", - "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "supported": false }, "type": "chat" }, { - "id": "baidu/ernie-5.0-thinking-preview", - "name": "Baidu: ERNIE-5.0-Thinking-Preview", - "display_name": "Baidu: ERNIE-5.0-Thinking-Preview", + "id": "gemini-2.5-flash-lite", + "name": "gemini-2.5-flash-lite", + "display_name": "gemini-2.5-flash-lite", "modalities": { "input": [ "text", "image", - "video" + "video", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 64000 + "context": 1048576, + "output": 65535 }, - "temperature": true, "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01-01", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", - "cost": { - "input": 0.84, - "output": 3.37 - }, - "type": "chat" - }, - { - "id": "baidu/ernie-x1.1-preview", - "name": "Baidu: ERNIE-X1.1-Preview", - "display_name": "Baidu: ERNIE-X1.1-Preview", - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, "reasoning": { "supported": false }, - "cost": { - "input": 0.136, - "output": 0.544 - }, "type": "chat" }, { - "id": "deepseek/deepseek-chat-v3.1", - "name": "DeepSeek: DeepSeek V3.1", - "display_name": "DeepSeek: DeepSeek V3.1", + "id": "gemini-2.5-flash-lite-preview-06-17", + "name": "gemini-2.5-flash-lite-preview-06-17", + "display_name": "gemini-2.5-flash-lite-preview-06-17", "modalities": { "input": [ - "text" + "text", + "video", + "image", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 1048576, + "output": 65535 }, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "type": "chat" }, { - "id": "deepseek/deepseek-v3.2", - "name": "DeepSeek: DeepSeek V3.2", - "display_name": "DeepSeek: DeepSeek V3.2", + "id": "gemini-2.5-flash-lite-preview-09-2025", + "name": "gemini-2.5-flash-lite-preview-09-2025", + "display_name": "gemini-2.5-flash-lite-preview-09-2025", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 64000 + "context": 1048576, + "output": 65536 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": false, - "knowledge": "2025-01-01", - "release_date": "2025-12-08", - "last_updated": "2025-12-08", - "cost": { - "input": 0.28, - "output": 0.43 - }, "type": "chat" }, { - "id": "deepseek/deepseek-chat", - "name": "DeepSeek: DeepSeek-V3.2 (Non-thinking Mode)", - "display_name": "DeepSeek: DeepSeek-V3.2 (Non-thinking Mode)", + "id": "gemini-2.5-flash-preview-05-20", + "name": "gemini-2.5-flash-preview-05-20", + "display_name": "gemini-2.5-flash-preview-05-20", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 163840, - "output": 163840 + "context": 1048576, + "output": 200000 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "knowledge": "2025-01-01", - "release_date": "2025-09-10", - "last_updated": "2025-09-10", - "cost": { - "input": 0.28, - "output": 0.42, - "cache_read": 0.03 - }, "type": "chat" }, { - "id": "deepseek/deepseek-reasoner", - "name": "DeepSeek: DeepSeek-V3.2 (Thinking Mode)", - "display_name": "DeepSeek: DeepSeek-V3.2 (Thinking Mode)", + "id": "gemini-2.5-pro", + "name": "gemini-2.5-pro", + "display_name": "gemini-2.5-pro", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 64000 + "context": 1048576, + "output": 65535 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "attachment": false, - "open_weights": false, - "knowledge": "2025-01-01", - "release_date": "2025-10-23", - "last_updated": "2025-10-23", - "cost": { - "input": 0.28, - "output": 0.42, - "cache_read": 0.03 + "supported": false }, "type": "chat" }, { - "id": "deepseek/deepseek-v3.2-exp", - "name": "DeepSeek: DeepSeek-V3.2-Exp", - "display_name": "DeepSeek: DeepSeek-V3.2-Exp", + "id": "gemini-2.5-pro-preview-06-05", + "name": "gemini-2.5-pro-preview-06-05", + "display_name": "gemini-2.5-pro-preview-06-05", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 163840, - "output": 8192 + "context": 1048576, + "output": 200000 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "knowledge": "2025-09", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", - "cost": { - "input": 0.28, - "output": 0.42 - }, "type": "chat" }, { - "id": "deepseek/deepseek-r1-0528", - "name": "DeepSeek: R1 0528", - "display_name": "DeepSeek: R1 0528", + "id": "gemini-3-flash-preview", + "name": "gemini-3-flash-preview", + "display_name": "gemini-3-flash-preview", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 65536, - "output": 8192 + "context": 1048576, + "output": 65536 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-06", - "release_date": "2025-05-28", - "last_updated": "2025-05-28", - "cost": { - "input": 0, - "output": 0 + "supported": false }, "type": "chat" }, { - "id": "google/gemini-2.0-flash", - "name": "Google: Gemini 2.0 Flash", - "display_name": "Google: Gemini 2.0 Flash", + "id": "gemini-3-pro-preview", + "name": "gemini-3-pro-preview", + "display_name": "gemini-3-pro-preview", "modalities": { "input": [ "text", "image", - "audio", "video", - "pdf" + "audio" ], "output": [ "text" @@ -96696,322 +107565,216 @@ }, "limit": { "context": 1048576, - "output": 8192 + "output": 65536 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-06", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", - "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.025 - }, "type": "chat" }, { - "id": "google/gemini-2.0-flash-lite-001", - "name": "Google: Gemini 2.0 Flash Lite", - "display_name": "Google: Gemini 2.0 Flash Lite", + "id": "google/gemma-3-27b-it", + "name": "Gemma 3 27B", + "display_name": "Gemma 3 27B", "modalities": { "input": [ "text", - "image", - "audio" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 8192 + "context": 32768, + "output": 32768 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, - "type": "imageGeneration" + "type": "chat" }, { - "id": "google/gemini-2.5-flash", - "name": "Google: Gemini 2.5 Flash", - "display_name": "Google: Gemini 2.5 Flash", + "id": "google/gemma-3-12b-it", + "name": "Gemma3 12B", + "display_name": "Gemma3 12B", "modalities": { "input": [ "text", - "image", - "audio", - "video", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 131072, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-03-20", - "last_updated": "2025-06-05", - "cost": { - "input": 0.3, - "output": 2.5, - "cache_read": 0.075 + "supported": false }, "type": "chat" }, { - "id": "google/gemini-2.5-flash-lite", - "name": "Google: Gemini 2.5 Flash Lite", - "display_name": "Google: Gemini 2.5 Flash Lite", + "id": "zai-org/glm-4.5v", + "name": "GLM 4.5V", + "display_name": "GLM 4.5V", "modalities": { "input": [ "text", "image", - "audio", - "video", - "pdf" + "video" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 65536, + "output": 16384 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-06-17", - "last_updated": "2025-06-17", - "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.025 - }, "type": "chat" }, { - "id": "google/gemini-2.5-pro", - "name": "Google: Gemini 2.5 Pro", - "display_name": "Google: Gemini 2.5 Pro", + "id": "zai-org/glm-4.5", + "name": "GLM-4.5", + "display_name": "GLM-4.5", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 131072, + "output": 98304 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-03-20", - "last_updated": "2025-06-05", - "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.31 - }, "type": "chat" }, { - "id": "google/gemini-3-flash-preview", - "name": "Google: Gemini 3 Flash Preview", - "display_name": "Google: Gemini 3 Flash Preview", + "id": "zai-org/glm-4.7", + "name": "GLM-4.7", + "display_name": "GLM-4.7", "modalities": { "input": [ - "text", - "image", - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 64000 + "context": 204800, + "output": 131072 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01-01", - "release_date": "2025-12-17", - "last_updated": "2025-12-17", - "cost": { - "input": 0.5, - "output": 3, - "cache_read": 0.05, - "cache_write": 1 - }, "type": "chat" }, { - "id": "google/gemini-3-flash-preview-free", - "name": "Google: Gemini 3 Flash Preview Free", - "display_name": "Google: Gemini 3 Flash Preview Free", + "id": "zai-org/glm-4.7-flash", + "name": "GLM-4.7-Flash", + "display_name": "GLM-4.7-Flash", "modalities": { "input": [ - "text", - "image", - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 64000 + "context": 200000, + "output": 128000 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01-01", - "release_date": "2025-12-17", - "last_updated": "2025-12-17", - "cost": { - "input": 0.5, - "output": 3, - "cache_read": 0.05, - "cache_write": 1 - }, "type": "chat" }, { - "id": "google/gemini-3-pro-preview", - "name": "Google: Gemini 3 Pro Preview", - "display_name": "Google: Gemini 3 Pro Preview", + "id": "zai-org/glm-ocr", + "name": "GLM-OCR", + "display_name": "GLM-OCR", "modalities": { "input": [ "text", - "image", - "video", - "audio", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 32000, + "output": 32000 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-11-18", - "last_updated": "2025-11-18", - "cost": { - "input": 2, - "output": 12, - "cache_read": 0.2 + "supported": false }, "type": "chat" }, { - "id": "google/gemma-3-12b-it", - "name": "Google: Gemma 3 12B", - "display_name": "Google: Gemma 3 12B", + "id": "gpt-4.1", + "name": "gpt-4.1", + "display_name": "gpt-4.1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 1047576, + "output": 32768 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2025-03-01", - "last_updated": "2025-03-01", - "cost": { - "input": 0, - "output": 0 - }, "type": "chat" }, { - "id": "inclusionai/ling-1t", - "name": "inclusionAI: Ling-1T", - "display_name": "inclusionAI: Ling-1T", + "id": "gpt-4.1-mini", + "name": "gpt-4.1-mini", + "display_name": "gpt-4.1-mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1047576, + "output": 32768 }, "tool_call": true, "reasoning": { @@ -97020,43 +107783,36 @@ "type": "chat" }, { - "id": "inclusionai/ling-flash-2.0", - "name": "inclusionAI: Ling-flash-2.0", - "display_name": "inclusionAI: Ling-flash-2.0", + "id": "gpt-4.1-nano", + "name": "gpt-4.1-nano", + "display_name": "gpt-4.1-nano", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1047576, + "output": 32768 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "release_date": "2025-09-18", - "last_updated": "2025-11-25", - "cost": { - "input": 0.14, - "output": 0.57 - }, "type": "chat" }, { - "id": "inclusionai/ling-mini-2.0", - "name": "inclusionAI: Ling-mini-2.0", - "display_name": "inclusionAI: Ling-mini-2.0", + "id": "gpt-4o", + "name": "gpt-4o", + "display_name": "gpt-4o", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -97064,151 +107820,123 @@ }, "limit": { "context": 131072, - "output": 8192 + "output": 131072 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "release_date": "2025-09-10", - "last_updated": "2025-11-25", - "cost": { - "input": 0.07, - "output": 0.28 - }, "type": "chat" }, { - "id": "inclusionai/llada2.0-flash-cap", - "name": "inclusionAI: LLaDA2-flash-CAP", - "display_name": "inclusionAI: LLaDA2-flash-CAP", + "id": "gpt-4o-mini", + "name": "gpt-4o-mini", + "display_name": "gpt-4o-mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32000, - "output": 32000 + "context": 131072, + "output": 131072 }, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "cost": { - "input": 0.28, - "output": 2.85, - "cache_read": 0.057 - }, "type": "chat" }, { - "id": "inclusionai/ming-flash-omni-preview", - "name": "inclusionAI: Ming-flash-omni Preview", - "display_name": "inclusionAI: Ming-flash-omni Preview", + "id": "gpt-5", + "name": "gpt-5", + "display_name": "gpt-5", "modalities": { "input": [ "text", - "audio", - "video", "image" ], "output": [ - "text", - "image", - "audio" + "text" ] }, "limit": { - "context": 64000, - "output": 64000 + "context": 400000, + "output": 128000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false - }, - "cost": { - "input": 0.8, - "output": 1.8 + "supported": true, + "default": true }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "inclusionai/ring-1t", - "name": "inclusionAI: Ring-1T", - "display_name": "inclusionAI: Ring-1T", + "id": "gpt-5-chat-latest", + "name": "gpt-5-chat-latest", + "display_name": "gpt-5-chat-latest", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 400000, + "output": 128000 }, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "type": "chat" }, { - "id": "inclusionai/ring-flash-2.0", - "name": "inclusionAI: Ring-flash-2.0", - "display_name": "inclusionAI: Ring-flash-2.0", + "id": "gpt-5-codex", + "name": "gpt-5-codex", + "display_name": "gpt-5-codex", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 400000, + "output": 128000 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "attachment": false, - "open_weights": false, - "release_date": "2025-09-29", - "last_updated": "2025-11-25", - "cost": { - "input": 0.14, - "output": 0.57 + "supported": false }, "type": "chat" }, { - "id": "inclusionai/ring-mini-2.0", - "name": "inclusionAI: Ring-mini-2.0", - "display_name": "inclusionAI: Ring-mini-2.0", + "id": "gpt-5-mini", + "name": "gpt-5-mini", + "display_name": "gpt-5-mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 400000, + "output": 128000 }, "tool_call": true, "reasoning": { @@ -97218,104 +107946,80 @@ "type": "chat" }, { - "id": "kuaishou/kat-coder-pro-v1", - "name": "KwaiKAT: KAT-Coder-Pro-V1", - "display_name": "KwaiKAT: KAT-Coder-Pro-V1", + "id": "gpt-5-nano", + "name": "gpt-5-nano", + "display_name": "gpt-5-nano", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 64000 + "context": 400000, + "output": 128000 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "knowledge": "2025-01-01", - "release_date": "2025-10-24", - "last_updated": "2025-10-24", - "cost": { - "input": 0, - "output": 0 - }, "type": "chat" }, { - "id": "kuaishou/kat-coder-pro-v1-free", - "name": "KwaiKAT: KAT-Coder-Pro-V1 Free", - "display_name": "KwaiKAT: KAT-Coder-Pro-V1 Free", + "id": "gpt-5-pro", + "name": "gpt-5-pro", + "display_name": "gpt-5-pro", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 64000 + "context": 400000, + "output": 272000 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "knowledge": "2025-01-01", - "release_date": "2025-10-24", - "last_updated": "2025-10-24", - "cost": { - "input": 0, - "output": 0 + "supported": true, + "default": true }, "type": "chat" }, { - "id": "meta/llama-3.3-70b-instruct", - "name": "Meta: Llama 3.3 70B Instruct", - "display_name": "Meta: Llama 3.3 70B Instruct", + "id": "gpt-5.1", + "name": "gpt-5.1", + "display_name": "gpt-5.1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 400000, + "output": 128000 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "release_date": "2024-11-26", - "last_updated": "2024-11-26", - "cost": { - "input": 0, - "output": 0 + "supported": true, + "default": true }, "type": "chat" }, { - "id": "meta/llama-4-scout-17b-16e-instruct", - "name": "Meta: Llama 4 Scout Instruct", - "display_name": "Meta: Llama 4 Scout Instruct", + "id": "gpt-5.1-chat-latest", + "name": "gpt-5.1-chat-latest", + "display_name": "gpt-5.1-chat-latest", "modalities": { "input": [ "text", @@ -97327,97 +108031,67 @@ }, "limit": { "context": 128000, - "output": 4096 + "output": 16000 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": true, - "knowledge": "2024-02", - "release_date": "2025-04-02", - "last_updated": "2025-04-02", - "cost": { - "input": 0, - "output": 0 + "supported": true, + "default": true }, "type": "chat" }, { - "id": "minimax/minimax-m2", - "name": "MiniMax: MiniMax M2", - "display_name": "MiniMax: MiniMax M2", + "id": "gpt-5.1-codex", + "name": "gpt-5.1-codex", + "display_name": "gpt-5.1-codex", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 205000, - "output": 131072 + "context": 400000, + "output": 128000 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-10-27", - "last_updated": "2025-10-27", - "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.03, - "cache_write": 0.38 - }, "type": "chat" }, { - "id": "minimax/minimax-m2.1", - "name": "MiniMax: MiniMax M2.1", - "display_name": "MiniMax: MiniMax M2.1", + "id": "gpt-5.1-codex-max", + "name": "gpt-5.1-codex-max", + "display_name": "gpt-5.1-codex-max", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 64000 + "context": 400000, + "output": 128000 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": false, - "knowledge": "2025-01-01", - "release_date": "2025-12-23", - "last_updated": "2025-12-23", - "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.03 - }, "type": "chat" }, { - "id": "mistralai/mistral-large-2512", - "name": "Mistral: Mistral Large 3", - "display_name": "Mistral: Mistral Large 3", + "id": "gpt-5.1-codex-mini", + "name": "gpt-5.1-codex-mini", + "display_name": "gpt-5.1-codex-mini", "modalities": { "input": [ "text", @@ -97428,39 +108102,31 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 400000, + "output": 128000 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": true, - "knowledge": "2024-11", - "release_date": "2024-11-01", - "last_updated": "2025-12-02", - "cost": { - "input": 0.5, - "output": 1.5 + "supported": true, + "default": true }, "type": "chat" }, { - "id": "moonshotai/kimi-k2-0711", - "name": "MoonshotAI: Kimi K2 0711", - "display_name": "MoonshotAI: Kimi K2 0711", + "id": "gpt-5.2", + "name": "gpt-5.2", + "display_name": "gpt-5.2", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 400000, "output": 128000 }, "tool_call": true, @@ -97470,111 +108136,103 @@ "type": "chat" }, { - "id": "moonshotai/kimi-k2-0905", - "name": "MoonshotAI: Kimi K2 0905", - "display_name": "MoonshotAI: Kimi K2 0905", + "id": "gpt-5.2-chat-latest", + "name": "gpt-5.2-chat-latest", + "display_name": "gpt-5.2-chat-latest", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 128000, + "output": 16000 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "knowledge": "2025-01-01", - "release_date": "2025-09-09", - "last_updated": "2025-09-09", - "cost": { - "input": 0.6, - "output": 2.5, - "cache_read": 0.15 - }, "type": "chat" }, { - "id": "moonshotai/kimi-k2-thinking", - "name": "MoonshotAI: Kimi K2 Thinking", - "display_name": "MoonshotAI: Kimi K2 Thinking", + "id": "gpt-5.2-codex", + "name": "gpt-5.2-codex", + "display_name": "gpt-5.2-codex", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 400000, + "output": 128000 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-07", - "release_date": "2025-11", - "last_updated": "2025-12", - "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 - }, "type": "chat" }, { - "id": "moonshotai/kimi-k2-thinking-turbo", - "name": "MoonshotAI: Kimi K2 Thinking Turbo", - "display_name": "MoonshotAI: Kimi K2 Thinking Turbo", + "id": "gpt-5.2-pro", + "name": "gpt-5.2-pro", + "display_name": "gpt-5.2-pro", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 64000 + "context": 400000, + "output": 128000 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": false, - "knowledge": "2025-01-01", - "release_date": "2025-11-06", - "last_updated": "2025-11-06", - "cost": { - "input": 1.15, - "output": 8, - "cache_read": 0.15 + "type": "chat" + }, + { + "id": "grok-3", + "name": "grok-3", + "display_name": "grok-3", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 32000 + }, + "tool_call": true, + "reasoning": { + "supported": false }, "type": "chat" }, { - "id": "openai/gpt-4.1", - "name": "OpenAI: GPT-4.1", - "display_name": "OpenAI: GPT-4.1", + "id": "grok-3-mini", + "name": "grok-3-mini", + "display_name": "grok-3-mini", "modalities": { "input": [ "text", @@ -97585,30 +108243,19 @@ ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 131072, + "output": 131072 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", - "cost": { - "input": 2, - "output": 8, - "cache_read": 0.5 - }, "type": "chat" }, { - "id": "openai/gpt-4.1-mini", - "name": "OpenAI: GPT-4.1 Mini", - "display_name": "OpenAI: GPT-4.1 Mini", + "id": "grok-4-0709", + "name": "grok-4-0709", + "display_name": "grok-4-0709", "modalities": { "input": [ "text", @@ -97619,30 +108266,19 @@ ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 256000, + "output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", - "cost": { - "input": 0.4, - "output": 1.6, - "cache_read": 0.1 - }, "type": "chat" }, { - "id": "openai/gpt-4.1-nano", - "name": "OpenAI: GPT-4.1 Nano", - "display_name": "OpenAI: GPT-4.1 Nano", + "id": "grok-4-1-fast-non-reasoning", + "name": "grok-4-1-fast-non-reasoning", + "display_name": "grok-4-1-fast-non-reasoning", "modalities": { "input": [ "text", @@ -97653,30 +108289,19 @@ ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 2000000, + "output": 2000000 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", - "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.03 - }, "type": "chat" }, { - "id": "openai/gpt-4o", - "name": "OpenAI: GPT-4o", - "display_name": "OpenAI: GPT-4o", + "id": "grok-4-1-fast-reasoning", + "name": "grok-4-1-fast-reasoning", + "display_name": "grok-4-1-fast-reasoning", "modalities": { "input": [ "text", @@ -97687,30 +108312,19 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 2000000, + "output": 2000000 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-05-13", - "last_updated": "2024-08-06", - "cost": { - "input": 2.5, - "output": 10, - "cache_read": 1.25 - }, "type": "chat" }, { - "id": "openai/gpt-4o-mini", - "name": "OpenAI: GPT-4o-mini", - "display_name": "OpenAI: GPT-4o-mini", + "id": "grok-4-fast-non-reasoning", + "name": "grok-4-fast-non-reasoning", + "display_name": "grok-4-fast-non-reasoning", "modalities": { "input": [ "text", @@ -97721,30 +108335,19 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 2000000, + "output": 2000000 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-07-18", - "last_updated": "2024-07-18", - "cost": { - "input": 0.15, - "output": 0.6, - "cache_read": 0.08 - }, "type": "chat" }, { - "id": "openai/gpt-5", - "name": "OpenAI: GPT-5", - "display_name": "OpenAI: GPT-5", + "id": "grok-4-fast-reasoning", + "name": "grok-4-fast-reasoning", + "display_name": "grok-4-fast-reasoning", "modalities": { "input": [ "text", @@ -97755,45 +108358,19 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 2000000, + "output": 2000000 }, - "temperature": false, "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", - "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.13 - }, - "type": "chat" - }, - { - "id": "openai/gpt-5-chat", - "name": "OpenAI: GPT-5 Chat", - "display_name": "OpenAI: GPT-5 Chat", - "limit": { - "context": 272000, - "output": 16384 - }, - "tool_call": false, "reasoning": { "supported": false }, "type": "chat" }, { - "id": "openai/gpt-5-codex", - "name": "OpenAI: GPT-5 Codex", - "display_name": "OpenAI: GPT-5 Codex", + "id": "grok-code-fast-1", + "name": "grok-code-fast-1", + "display_name": "grok-code-fast-1", "modalities": { "input": [ "text", @@ -97804,172 +108381,112 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 256000, + "output": 256000 }, - "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-09-15", - "last_updated": "2025-09-15", - "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "supported": false }, "type": "chat" }, { - "id": "openai/gpt-5-mini", - "name": "OpenAI: GPT-5 Mini", - "display_name": "OpenAI: GPT-5 Mini", + "id": "moonshotai/kimi-k2-0905", + "name": "Kimi K2 0905", + "display_name": "Kimi K2 0905", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 262144, + "output": 262144 }, - "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", - "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.03 + "supported": false }, "type": "chat" }, { - "id": "openai/gpt-5-nano", - "name": "OpenAI: GPT-5 Nano", - "display_name": "OpenAI: GPT-5 Nano", + "id": "moonshotai/kimi-k2-instruct", + "name": "Kimi K2 Instruct", + "display_name": "Kimi K2 Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 131072, + "output": 131072 }, - "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", - "cost": { - "input": 0.05, - "output": 0.4, - "cache_read": 0.01 + "supported": false }, "type": "chat" }, { - "id": "openai/gpt-5-pro", - "name": "OpenAI: GPT-5 Pro", - "display_name": "OpenAI: GPT-5 Pro", + "id": "moonshotai/kimi-k2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 262144, + "output": 262144 }, - "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-10-06", - "last_updated": "2025-10-06", - "cost": { - "input": 14, - "output": 110 - }, "type": "chat" }, { - "id": "openai/gpt-5.1", - "name": "OpenAI: GPT-5.1", - "display_name": "OpenAI: GPT-5.1", + "id": "sao10k/l3-70b-euryale-v2.1", + "name": "L3 70B Euryale V2.1", + "display_name": "L3 70B Euryale V2.1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 8192, + "output": 8192 }, - "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", - "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.13 + "supported": false }, "type": "chat" }, { - "id": "openai/gpt-5.1-chat", - "name": "OpenAI: GPT-5.1 Chat", - "display_name": "OpenAI: GPT-5.1 Chat", + "id": "Sao10K/L3-8B-Stheno-v3.2", + "name": "L3 8B Stheno V3.2", + "display_name": "L3 8B Stheno V3.2", "modalities": { "input": [ - "image", "text" ], "output": [ @@ -97977,68 +108494,43 @@ ] }, "limit": { - "context": 128000, - "output": 64000 + "context": 8192, + "output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01-01", - "release_date": "2025-11-14", - "last_updated": "2025-11-14", - "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.13 - }, "type": "chat" }, { - "id": "openai/gpt-5.1-codex", - "name": "OpenAI: GPT-5.1-Codex", - "display_name": "OpenAI: GPT-5.1-Codex", + "id": "sao10k/l31-70b-euryale-v2.2", + "name": "L31 70B Euryale V2.2", + "display_name": "L31 70B Euryale V2.2", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 8192, + "output": 8192 }, - "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", - "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "supported": false }, "type": "chat" }, { - "id": "openai/gpt-5.1-codex-mini", - "name": "OpenAI: GPT-5.1-Codex-Mini", - "display_name": "OpenAI: GPT-5.1-Codex-Mini", + "id": "meta-llama/llama-3.1-8b-instruct", + "name": "Llama 3.1 8B Instruct", + "display_name": "Llama 3.1 8B Instruct", "modalities": { "input": [ - "image", "text" ], "output": [ @@ -98046,101 +108538,63 @@ ] }, "limit": { - "context": 400000, - "output": 64000 + "context": 16384, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01-01", - "release_date": "2025-11-14", - "last_updated": "2025-11-14", - "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.03 + "supported": false }, "type": "chat" }, { - "id": "openai/gpt-5.2", - "name": "OpenAI: GPT-5.2", - "display_name": "OpenAI: GPT-5.2", + "id": "meta-llama/llama-3.2-3b-instruct", + "name": "Llama 3.2 3B Instruct", + "display_name": "Llama 3.2 3B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 32768, + "output": 32000 }, - "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", - "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "supported": false }, "type": "chat" }, { - "id": "openai/gpt-5.2-chat", - "name": "OpenAI: GPT-5.2 Chat", - "display_name": "OpenAI: GPT-5.2 Chat", + "id": "meta-llama/llama-3.3-70b-instruct", + "name": "Llama 3.3 70B Instruct", + "display_name": "Llama 3.3 70B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 131072, + "output": 120000 }, - "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", - "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "supported": false }, "type": "chat" }, { - "id": "openai/gpt-5.2-pro", - "name": "OpenAI: GPT-5.2 Pro", - "display_name": "OpenAI: GPT-5.2 Pro", + "id": "meta-llama/llama-4-maverick-17b-128e-instruct-fp8", + "name": "Llama 4 Maverick Instruct", + "display_name": "Llama 4 Maverick Instruct", "modalities": { "input": [ "text", @@ -98151,29 +108605,19 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 1048576, + "output": 1048576 }, - "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "attachment": true, - "open_weights": false, - "release_date": "2025-12-11", - "last_updated": "2025-12-11", - "cost": { - "input": 19, - "output": 150 + "supported": false }, "type": "chat" }, { - "id": "openai/o4-mini", - "name": "OpenAI: o4 Mini", - "display_name": "OpenAI: o4 Mini", + "id": "meta-llama/llama-4-scout-17b-16e-instruct", + "name": "Llama 4 Scout Instruct", + "display_name": "Llama 4 Scout Instruct", "modalities": { "input": [ "text", @@ -98184,31 +108628,19 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 131072, + "output": 131072 }, - "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-05", - "release_date": "2025-04-16", - "last_updated": "2025-04-16", - "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.28 + "supported": false }, "type": "chat" }, { - "id": "qwen/qwen3-14b", - "name": "Qwen: Qwen3 14B", - "display_name": "Qwen: Qwen3 14B", + "id": "minimaxai/minimax-m1-80k", + "name": "MiniMax M1", + "display_name": "MiniMax M1", "modalities": { "input": [ "text" @@ -98218,28 +108650,20 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1000000, + "output": 40000 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "release_date": "2025-04-30", - "last_updated": "2025-11-25", - "cost": { - "input": 0.07, - "output": 0.28 + "supported": true, + "default": true }, "type": "chat" }, { - "id": "qwen/qwen3-235b-a22b-2507", - "name": "Qwen: Qwen3 235B A22B Instruct 2507", - "display_name": "Qwen: Qwen3 235B A22B Instruct 2507", + "id": "minimax/minimax-m2.1", + "name": "Minimax M2.1", + "display_name": "Minimax M2.1", "modalities": { "input": [ "text" @@ -98249,8 +108673,8 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 204800, + "output": 131072 }, "tool_call": true, "reasoning": { @@ -98260,9 +108684,9 @@ "type": "chat" }, { - "id": "qwen/qwen3-235b-a22b-thinking-2507", - "name": "Qwen: Qwen3 235B A22B Thinking 2507", - "display_name": "Qwen: Qwen3 235B A22B Thinking 2507", + "id": "mistralai/mistral-7b-instruct", + "name": "Mistral 7B Instruct", + "display_name": "Mistral 7B Instruct", "modalities": { "input": [ "text" @@ -98272,30 +108696,19 @@ ] }, "limit": { - "context": 262144, + "context": 32768, "output": 8192 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "attachment": false, - "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-07-25", - "last_updated": "2025-10-04", - "cost": { - "input": 0.2, - "output": 0.8 + "supported": false }, "type": "chat" }, { - "id": "qwen/qwen3-max-preview", - "name": "Qwen: Qwen3 Max Thinking Preview", - "display_name": "Qwen: Qwen3 Max Thinking Preview", + "id": "mistralai/mistral-nemo", + "name": "Mistral Nemo", + "display_name": "Mistral Nemo", "modalities": { "input": [ "text" @@ -98305,21 +108718,19 @@ ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 60288, + "output": 32000 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, "type": "chat" }, { - "id": "qwen/qwen3-coder", - "name": "Qwen: Qwen3-Coder", - "display_name": "Qwen: Qwen3-Coder", + "id": "gryphe/mythomax-l2-13b", + "name": "Mythomax L2 13B", + "display_name": "Mythomax L2 13B", "modalities": { "input": [ "text" @@ -98329,74 +108740,54 @@ ] }, "limit": { - "context": 262144, - "output": 66536 + "context": 4096, + "output": 4096 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-23", - "last_updated": "2025-07-23", - "cost": { - "input": 0.3, - "output": 1.2 - }, "type": "chat" }, { - "id": "qwen/qwen3-coder-plus", - "name": "Qwen: Qwen3-Coder-Plus", - "display_name": "Qwen: Qwen3-Coder-Plus", + "id": "nova-2-Lite", + "name": "nova-2-Lite", + "display_name": "nova-2-Lite", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 4096, - "output": 4096 + "context": 1000000, + "output": 1000000 }, - "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "knowledge": "2025-01-01", - "release_date": "2025-09-10", - "last_updated": "2025-09-10", - "cost": { - "input": 1, - "output": 5, - "cache_read": 0.1, - "cache_write": 1.25 - }, "type": "chat" }, { - "id": "qwen/qwen3-max", - "name": "Qwen: Qwen3-Max", - "display_name": "Qwen: Qwen3-Max", + "id": "o1", + "name": "o1", + "display_name": "o1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 32768 + "context": 131072, + "output": 131072 }, "tool_call": true, "reasoning": { @@ -98405,9 +108796,9 @@ "type": "chat" }, { - "id": "qwen/qwen3-vl-plus", - "name": "Qwen: Qwen3-VL-Plus", - "display_name": "Qwen: Qwen3-VL-Plus", + "id": "o1-mini", + "name": "o1-mini", + "display_name": "o1-mini", "modalities": { "input": [ "text", @@ -98418,105 +108809,89 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 131072, + "output": 131072 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "stepfun/step-3", - "name": "StepFun: Step-3", - "display_name": "StepFun: Step-3", + "id": "o3", + "name": "o3", + "display_name": "o3", "modalities": { "input": [ - "image", - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 65536, - "output": 64000 + "context": 131072, + "output": 131072 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01-01", - "release_date": "2025-12-18", - "last_updated": "2025-12-18", - "cost": { - "input": 0.21, - "output": 0.57 + "supported": false }, "type": "chat" }, { - "id": "volcengine/doubao-seed-1-6-vision", - "name": "VolcanoEngine: Doubao-Seed-1.6-vision", - "display_name": "VolcanoEngine: Doubao-Seed-1.6-vision", + "id": "o3-mini", + "name": "o3-mini", + "display_name": "o3-mini", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, "limit": { - "context": 256000, - "output": 32000 + "context": 131072, + "output": 131072 }, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "type": "chat" }, { - "id": "volcengine/doubao-seed-1.8", - "name": "VolcanoEngine: Doubao-Seed-1.8", - "display_name": "VolcanoEngine: Doubao-Seed-1.8", + "id": "openai/gpt-oss-120b", + "name": "OpenAI GPT OSS 120B", + "display_name": "OpenAI GPT OSS 120B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 64000 + "context": 131072, + "output": 131072 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": false, - "knowledge": "2025-01-01", - "release_date": "2025-12-18", - "last_updated": "2025-12-18", - "cost": { - "input": 0.11, - "output": 0.28, - "cache_read": 0.02, - "cache_write": 0 - }, "type": "chat" }, { - "id": "volcengine/doubao-seed-code", - "name": "VolcanoEngine: Doubao-Seed-Code", - "display_name": "VolcanoEngine: Doubao-Seed-Code", + "id": "openai/gpt-oss-20b", + "name": "OpenAI: GPT OSS 20B", + "display_name": "OpenAI: GPT OSS 20B", "modalities": { "input": [ "text", @@ -98527,31 +108902,20 @@ ] }, "limit": { - "context": 256000, - "output": 64000 + "context": 131072, + "output": 32768 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01-01", - "release_date": "2025-11-11", - "last_updated": "2025-11-11", - "cost": { - "input": 0.17, - "output": 1.12, - "cache_read": 0.03 - }, "type": "chat" }, { - "id": "x-ai/grok-4", - "name": "xAI: Grok 4", - "display_name": "xAI: Grok 4", + "id": "qwen/qwen-2.5-72b-instruct", + "name": "Qwen 2.5 72B Instruct", + "display_name": "Qwen 2.5 72B Instruct", "modalities": { "input": [ "text" @@ -98561,170 +108925,110 @@ ] }, "limit": { - "context": 256000, - "output": 64000 + "context": 32000, + "output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "attachment": false, - "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-07-09", - "last_updated": "2025-07-09", - "cost": { - "input": 3, - "output": 15, - "cache_read": 0.75, - "cache_write": 15 + "supported": false }, "type": "chat" }, { - "id": "x-ai/grok-4-fast", - "name": "xAI: Grok 4 Fast", - "display_name": "xAI: Grok 4 Fast", + "id": "qwen/qwen-mt-plus", + "name": "Qwen MT Plus", + "display_name": "Qwen MT Plus", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 4096, + "output": 2048 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-09-19", - "last_updated": "2025-09-19", - "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 + "supported": false }, "type": "chat" }, { - "id": "x-ai/grok-4-fast-non-reasoning", - "name": "xAI: Grok 4 Fast None Reasoning", - "display_name": "xAI: Grok 4 Fast None Reasoning", + "id": "qwen/qwen2.5-7b-instruct", + "name": "Qwen2.5 7B Instruct", + "display_name": "Qwen2.5 7B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 32000, + "output": 32000 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-09-19", - "last_updated": "2025-09-19", - "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 - }, "type": "chat" }, { - "id": "x-ai/grok-4.1-fast", - "name": "xAI: Grok 4.1 Fast", - "display_name": "xAI: Grok 4.1 Fast", + "id": "qwen/qwen2.5-vl-72b-instruct", + "name": "Qwen2.5 VL 72B Instruct", + "display_name": "Qwen2.5 VL 72B Instruct", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 64000 + "context": 32768, + "output": 32768 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01-01", - "release_date": "2025-11-20", - "last_updated": "2025-11-20", - "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 + "supported": false }, "type": "chat" }, { - "id": "x-ai/grok-4.1-fast-non-reasoning", - "name": "xAI: Grok 4.1 Fast Non Reasoning", - "display_name": "xAI: Grok 4.1 Fast Non Reasoning", + "id": "qwen/qwen3-235b-a22b-fp8", + "name": "Qwen3 235B A22B", + "display_name": "Qwen3 235B A22B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 64000 + "context": 40960, + "output": 20000 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01-01", - "release_date": "2025-11-20", - "last_updated": "2025-11-20", - "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 + "supported": true, + "default": true }, "type": "chat" }, { - "id": "x-ai/grok-code-fast-1", - "name": "xAI: Grok Code Fast 1", - "display_name": "xAI: Grok Code Fast 1", + "id": "qwen/qwen3-235b-a22b-instruct-2507", + "name": "Qwen3 235B A22B Instruct 2507", + "display_name": "Qwen3 235B A22B Instruct 2507", "modalities": { "input": [ "text" @@ -98734,31 +109038,19 @@ ] }, "limit": { - "context": 256000, - "output": 10000 + "context": 131072, + "output": 16384 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "attachment": false, - "open_weights": false, - "knowledge": "2023-10", - "release_date": "2025-08-28", - "last_updated": "2025-08-28", - "cost": { - "input": 0.2, - "output": 1.5, - "cache_read": 0.02 + "supported": false }, "type": "chat" }, { - "id": "xiaomi/mimo-v2-flash", - "name": "Xiaomi: MiMo-V2-Flash", - "display_name": "Xiaomi: MiMo-V2-Flash", + "id": "qwen/qwen3-235b-a22b-thinking-2507", + "name": "Qwen3 235B A22b Thinking 2507", + "display_name": "Qwen3 235B A22b Thinking 2507", "modalities": { "input": [ "text" @@ -98768,30 +109060,20 @@ ] }, "limit": { - "context": 262144, - "output": 64000 + "context": 131072, + "output": 131072 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": false, - "knowledge": "2025-01-01", - "release_date": "2025-12-17", - "last_updated": "2025-12-17", - "cost": { - "input": 0, - "output": 0 - }, "type": "chat" }, { - "id": "xiaomi/mimo-v2-flash-free", - "name": "Xiaomi: MiMo-V2-Flash Free", - "display_name": "Xiaomi: MiMo-V2-Flash Free", + "id": "qwen/qwen3-30b-a3b-fp8", + "name": "Qwen3 30B A3B", + "display_name": "Qwen3 30B A3B", "modalities": { "input": [ "text" @@ -98801,30 +109083,20 @@ ] }, "limit": { - "context": 262144, - "output": 64000 + "context": 40960, + "output": 20000 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": false, - "knowledge": "2025-01-01", - "release_date": "2025-12-17", - "last_updated": "2025-12-17", - "cost": { - "input": 0, - "output": 0 - }, "type": "chat" }, { - "id": "z-ai/glm-4.5", - "name": "Z.AI: GLM 4.5", - "display_name": "Z.AI: GLM 4.5", + "id": "qwen/qwen3-32b-fp8", + "name": "Qwen3 32B", + "display_name": "Qwen3 32B", "modalities": { "input": [ "text" @@ -98834,28 +109106,20 @@ ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 40960, + "output": 20000 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "release_date": "2025-07-28", - "last_updated": "2025-11-25", - "cost": { - "input": 0.4, - "output": 2 + "supported": true, + "default": true }, "type": "chat" }, { - "id": "z-ai/glm-4.5-air", - "name": "Z.AI: GLM 4.5 Air", - "display_name": "Z.AI: GLM 4.5 Air", + "id": "qwen/qwen3-coder-480b-a35b-instruct", + "name": "Qwen3 Coder 480B A35B Instruct", + "display_name": "Qwen3 Coder 480B A35B Instruct", "modalities": { "input": [ "text" @@ -98865,28 +109129,19 @@ ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 262144, + "output": 65536 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "release_date": "2025-07-28", - "last_updated": "2025-11-25", - "cost": { - "input": 0.14, - "output": 0.86 - }, "type": "chat" }, { - "id": "z-ai/glm-4.6", - "name": "Z.AI: GLM 4.6", - "display_name": "Z.AI: GLM 4.6", + "id": "qwen/qwen3-coder-next", + "name": "Qwen3 Coder Next FP8", + "display_name": "Qwen3 Coder Next FP8", "modalities": { "input": [ "text" @@ -98896,138 +109151,86 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 262144, + "output": 65536 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-09-30", - "last_updated": "2025-09-30", - "cost": { - "input": 0.6, - "output": 2.2, - "cache_read": 0.11, - "cache_write": 0 + "supported": false }, "type": "chat" }, { - "id": "z-ai/glm-4.6v", - "name": "Z.AI: GLM 4.6V", - "display_name": "Z.AI: GLM 4.6V", + "id": "qwen/qwen3-next-80b-a3b-instruct", + "name": "Qwen3 Next 80B A3B Instruct", + "display_name": "Qwen3 Next 80B A3B Instruct", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 65536, + "output": 65536 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01-01", - "release_date": "2025-12-08", - "last_updated": "2025-12-08", - "cost": { - "input": 0.14, - "output": 0.42, - "cache_read": 0.03 + "supported": false }, "type": "chat" }, { - "id": "z-ai/glm-4.6v-flash-free", - "name": "Z.AI: GLM 4.6V Flash (Free)", - "display_name": "Z.AI: GLM 4.6V Flash (Free)", + "id": "qwen/qwen3-next-80b-a3b-thinking", + "name": "Qwen3 Next 80B A3B Thinking", + "display_name": "Qwen3 Next 80B A3B Thinking", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 65536, + "output": 65536 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01-01", - "release_date": "2025-12-08", - "last_updated": "2025-12-08", - "cost": { - "input": 0, - "output": 0 - }, "type": "chat" }, { - "id": "z-ai/glm-4.6v-flash", - "name": "Z.AI: GLM 4.6V FlashX", - "display_name": "Z.AI: GLM 4.6V FlashX", + "id": "sao10k/l3-8b-lunaris", + "name": "Sao10k L3 8B Lunaris", + "display_name": "Sao10k L3 8B Lunaris", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 8192, + "output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01-01", - "release_date": "2025-12-08", - "last_updated": "2025-12-08", - "cost": { - "input": 0, - "output": 0 + "supported": false }, "type": "chat" }, { - "id": "z-ai/glm-4.7", - "name": "Z.AI: GLM 4.7", - "display_name": "Z.AI: GLM 4.7", + "id": "xiaomimimo/mimo-v2-flash", + "name": "XiaomiMiMo/MiMo-V2-Flash", + "display_name": "XiaomiMiMo/MiMo-V2-Flash", "modalities": { "input": [ "text" @@ -99037,25 +109240,14 @@ ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 262144, + "output": 131072 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": false, - "knowledge": "2025-01-01", - "release_date": "2025-12-23", - "last_updated": "2025-12-23", - "cost": { - "input": 0.28, - "output": 1.14, - "cache_read": 0.06 - }, "type": "chat" } ] diff --git a/src/main/presenter/configPresenter/index.ts b/src/main/presenter/configPresenter/index.ts index 01ead3eef..3376d958b 100644 --- a/src/main/presenter/configPresenter/index.ts +++ b/src/main/presenter/configPresenter/index.ts @@ -434,6 +434,34 @@ export class ConfigPresenter implements IConfigPresenter { console.warn('Failed to migrate legacy default_system_prompt:', e) } } + + // Before version 0.5.8, split OpenAI Responses and OpenAI Completions semantics + if (oldVersion && compare(oldVersion, '0.5.8', '<')) { + const providers = this.getProviders() + let hasChanges = false + + const migratedProviders = providers.map((provider) => { + if (provider.apiType === 'openai-compatible') { + hasChanges = true + return { ...provider, apiType: 'openai-completions' } + } + + if ( + provider.id !== 'openai' && + provider.id !== 'minimax' && + provider.apiType === 'openai' + ) { + hasChanges = true + return { ...provider, apiType: 'openai-completions' } + } + + return provider + }) + + if (hasChanges) { + this.setProviders(migratedProviders) + } + } } private migrateMinimaxProvider(): void { diff --git a/src/main/presenter/configPresenter/providers.ts b/src/main/presenter/configPresenter/providers.ts index db04a89d4..13bcc84ed 100644 --- a/src/main/presenter/configPresenter/providers.ts +++ b/src/main/presenter/configPresenter/providers.ts @@ -34,7 +34,7 @@ export const DEFAULT_PROVIDERS: LLM_PROVIDER_BASE[] = [ { id: 'qiniu', name: 'Qiniu', - apiType: 'openai', + apiType: 'openai-completions', apiKey: '', baseUrl: 'https://api.qnaigc.com/v1', enable: false, @@ -80,7 +80,7 @@ export const DEFAULT_PROVIDERS: LLM_PROVIDER_BASE[] = [ { id: 'ppio', name: 'PPIO', - apiType: 'openai', + apiType: 'openai-completions', apiKey: '', baseUrl: 'https://api.ppinfra.com/v3/openai', enable: false, @@ -128,7 +128,7 @@ export const DEFAULT_PROVIDERS: LLM_PROVIDER_BASE[] = [ { id: 'tokenflux', name: 'TokenFlux', - apiType: 'openai', + apiType: 'openai-completions', apiKey: '', baseUrl: 'https://tokenflux.ai/v1', enable: false, @@ -144,7 +144,7 @@ export const DEFAULT_PROVIDERS: LLM_PROVIDER_BASE[] = [ { id: 'burncloud', name: 'BurnCloud', - apiType: 'openai', + apiType: 'openai-completions', apiKey: '', baseUrl: 'https://ai.burncloud.com', enable: false, @@ -280,7 +280,7 @@ export const DEFAULT_PROVIDERS: LLM_PROVIDER_BASE[] = [ { id: 'openrouter', name: 'OpenRouter', - apiType: 'openai', + apiType: 'openai-completions', apiKey: '', baseUrl: 'https://openrouter.ai/api/v1/', enable: false, @@ -310,7 +310,7 @@ export const DEFAULT_PROVIDERS: LLM_PROVIDER_BASE[] = [ { id: '302ai', name: '302.AI', - apiType: 'openai', + apiType: 'openai-completions', apiKey: '', baseUrl: 'https://api.302.ai/v1', enable: false, @@ -370,7 +370,7 @@ export const DEFAULT_PROVIDERS: LLM_PROVIDER_BASE[] = [ { id: 'github', name: 'GitHub Models', - apiType: 'openai', + apiType: 'openai-completions', apiKey: '', baseUrl: 'https://models.inference.ai.azure.com', enable: false, @@ -476,7 +476,7 @@ export const DEFAULT_PROVIDERS: LLM_PROVIDER_BASE[] = [ { id: 'moonshot', name: 'Moonshot', - apiType: 'openai', + apiType: 'openai-completions', apiKey: '', baseUrl: 'https://api.moonshot.cn/v1', enable: false, @@ -628,7 +628,7 @@ export const DEFAULT_PROVIDERS: LLM_PROVIDER_BASE[] = [ { id: 'aihubmix', name: 'AIHubMix', - apiType: 'openai', + apiType: 'openai-completions', apiKey: '', baseUrl: 'https://aihubmix.com/v1', enable: false, @@ -673,7 +673,7 @@ export const DEFAULT_PROVIDERS: LLM_PROVIDER_BASE[] = [ { id: 'hunyuan', name: 'Hunyuan', - apiType: 'openai', + apiType: 'openai-completions', apiKey: '', baseUrl: 'https://api.hunyuan.cloud.tencent.com/v1', enable: false, @@ -703,7 +703,7 @@ export const DEFAULT_PROVIDERS: LLM_PROVIDER_BASE[] = [ { id: 'azure-openai', name: 'Azure OpenAI', - apiType: 'openai', + apiType: 'openai-completions', apiKey: '', baseUrl: '', enable: false, @@ -720,7 +720,7 @@ export const DEFAULT_PROVIDERS: LLM_PROVIDER_BASE[] = [ { id: 'modelscope', name: 'ModelScope', - apiType: 'openai', + apiType: 'openai-completions', apiKey: '', baseUrl: 'https://api-inference.modelscope.cn/v1/', enable: false, @@ -750,7 +750,7 @@ export const DEFAULT_PROVIDERS: LLM_PROVIDER_BASE[] = [ { id: 'xiaomi', name: 'Xiaomi', - apiType: 'openai', + apiType: 'openai-completions', apiKey: '', baseUrl: 'https://api.xiaomimimo.com/v1', enable: false, diff --git a/src/main/presenter/llmProviderPresenter/managers/providerInstanceManager.ts b/src/main/presenter/llmProviderPresenter/managers/providerInstanceManager.ts index 49900bb4a..f15f2a1ee 100644 --- a/src/main/presenter/llmProviderPresenter/managers/providerInstanceManager.ts +++ b/src/main/presenter/llmProviderPresenter/managers/providerInstanceManager.ts @@ -1,7 +1,6 @@ import { ProviderBatchUpdate, ProviderChange } from '@shared/provider-operations' import { IConfigPresenter, LLM_PROVIDER } from '@shared/presenter' import { BaseLLMProvider } from '../baseProvider' -import { OpenAIProvider } from '../providers/openAIProvider' import { DeepseekProvider } from '../providers/deepseekProvider' import { SiliconcloudProvider } from '../providers/siliconcloudProvider' import { DashscopeProvider } from '../providers/dashscopeProvider' @@ -85,7 +84,7 @@ export class ProviderInstanceManager { ['ollama', OllamaProvider], ['anthropic', AnthropicProvider], ['doubao', DoubaoProvider], - ['openai', OpenAIProvider], + ['openai', OpenAIResponsesProvider], ['voiceai', VoiceAIProvider], ['openai-responses', OpenAIResponsesProvider], ['cherryin', CherryInProvider], @@ -118,7 +117,8 @@ export class ProviderInstanceManager { ['ollama', OllamaProvider], ['anthropic', AnthropicProvider], ['doubao', DoubaoProvider], - ['openai', OpenAIProvider], + ['openai', OpenAIResponsesProvider], + ['openai-completions', OpenAICompatibleProvider], ['voiceai', VoiceAIProvider], ['openai-compatible', OpenAICompatibleProvider], ['openai-responses', OpenAIResponsesProvider], diff --git a/src/renderer/settings/components/AddCustomProviderDialog.vue b/src/renderer/settings/components/AddCustomProviderDialog.vue index 6ee34af7e..f60626a94 100644 --- a/src/renderer/settings/components/AddCustomProviderDialog.vue +++ b/src/renderer/settings/components/AddCustomProviderDialog.vue @@ -33,7 +33,7 @@ OpenAI - OpenAI Responses + OpenAI Completions Gemini Anthropic Ollama @@ -69,8 +69,8 @@ :placeholder="t('settings.provider.dialog.addCustomProvider.baseUrlPlaceholder')" required /> -
- {{ `${formData.baseUrl ?? ''}/chat/completions` }} +
+ {{ `${formData.baseUrl ?? ''}${apiEndpointSuffix}` }}
@@ -100,7 +100,7 @@ diff --git a/src/renderer/settings/main.ts b/src/renderer/settings/main.ts index 0b232988c..679f19971 100644 --- a/src/renderer/settings/main.ts +++ b/src/renderer/settings/main.ts @@ -82,6 +82,16 @@ const router = createRouter({ position: 6 } }, + { + path: '/notifications-hooks', + name: 'settings-notifications-hooks', + component: () => import('./components/NotificationsHooksSettings.vue'), + meta: { + titleKey: 'routes.settings-notifications-hooks', + icon: 'lucide:bell', + position: 6.5 + } + }, { path: '/skills', name: 'settings-skills', diff --git a/src/renderer/src/i18n/da-DK/routes.json b/src/renderer/src/i18n/da-DK/routes.json index e895b716a..4627e8d05 100644 --- a/src/renderer/src/i18n/da-DK/routes.json +++ b/src/renderer/src/i18n/da-DK/routes.json @@ -14,5 +14,6 @@ "settings-prompt": "Prompter", "settings-mcp-market": "MCP-marked", "settings-acp": "ACP-agenter", - "settings-skills": "Skills" + "settings-skills": "Skills", + "settings-notifications-hooks": "Notifikationer og Hooks" } diff --git a/src/renderer/src/i18n/da-DK/settings.json b/src/renderer/src/i18n/da-DK/settings.json index 6c92db318..5d3fae559 100644 --- a/src/renderer/src/i18n/da-DK/settings.json +++ b/src/renderer/src/i18n/da-DK/settings.json @@ -1225,5 +1225,59 @@ "title": "Eksterne værktøjer" }, "title": "Færdighedsstyring" + }, + "notificationsHooks": { + "commands": { + "commandPlaceholder": "Kommandoen der skal udføres", + "description": "Udfør kommandoen for hver begivenhed.", + "hint": "Skriv payload som JSON til stdin.", + "title": "Hooks kommandoer" + }, + "confirmo": { + "description": "Send notifikationer via Confirmo Hook (standard sender alle begivenheder).", + "title": "Confirmo", + "unavailable": "Confirmo Hook ikke fundet: {path}" + }, + "description": "Konfigurer webhook-notifikationer og livscyklus-hooks.", + "discord": { + "description": "Send notifikationer via Discord webhook.", + "title": "Discord", + "webhookUrl": "Webhook-URL", + "webhookUrlPlaceholder": "https://discord.com/api/webhooks/..." + }, + "events": { + "PermissionRequest": "Tilladelsesforespørgsel", + "PostToolUse": "Efter værktøjskald", + "PostToolUseFailure": "Værktøjsopkald mislykkedes", + "PreToolUse": "Før værktøjskald", + "SessionEnd": "Samtalen er slut", + "SessionStart": "Samtalen starter", + "Stop": "stop", + "UserPromptSubmit": "Brugerindsendelse", + "title": "begivenhed" + }, + "telegram": { + "botToken": "Bot-token", + "botTokenPlaceholder": "Telegram Bot Token", + "chatId": "Chat-ID", + "chatIdPlaceholder": "For eksempel 123456789", + "description": "Send notifikationer via Telegram Bot.", + "threadId": "Trådid (valgfri)", + "threadIdPlaceholder": "Valgfri tråd-ID", + "title": "Telegram" + }, + "test": { + "button": "Test", + "duration": "{ms} ms", + "exitCode": "Afslutningskode {code}", + "failed": "mislykkelse", + "retryAfter": "Prøv igen om {ms} ms", + "statusCode": "HTTP {code}", + "stderr": "stderr", + "stdout": "stdout", + "success": "succes", + "testing": "Tester..." + }, + "title": "Notifikationer og Hooks" } } diff --git a/src/renderer/src/i18n/en-US/routes.json b/src/renderer/src/i18n/en-US/routes.json index 0b9c13798..22c2af75b 100644 --- a/src/renderer/src/i18n/en-US/routes.json +++ b/src/renderer/src/i18n/en-US/routes.json @@ -14,5 +14,6 @@ "settings-prompt": "Prompts", "settings-mcp-market": "MCP Market", "settings-acp": "ACP Agents", - "settings-skills": "Skills" + "settings-skills": "Skills", + "settings-notifications-hooks": "Notifications & Hooks" } diff --git a/src/renderer/src/i18n/en-US/settings.json b/src/renderer/src/i18n/en-US/settings.json index 679e86298..fa84e3210 100644 --- a/src/renderer/src/i18n/en-US/settings.json +++ b/src/renderer/src/i18n/en-US/settings.json @@ -64,6 +64,60 @@ "fileMaxSize": "File Maximum Size", "fileMaxSizeHint": "Limits the maximum size of a single uploaded file" }, + "notificationsHooks": { + "title": "Notifications & Hooks", + "description": "Configure webhook notifications and lifecycle hooks.", + "events": { + "title": "Events", + "SessionStart": "Session Start", + "UserPromptSubmit": "User Prompt Submit", + "PreToolUse": "Pre Tool Use", + "PostToolUse": "Post Tool Use", + "PostToolUseFailure": "Tool Use Failure", + "PermissionRequest": "Permission Request", + "Stop": "Stop", + "SessionEnd": "Session End" + }, + "telegram": { + "title": "Telegram", + "description": "Send notifications via Telegram bot.", + "botToken": "Bot Token", + "botTokenPlaceholder": "Telegram bot token", + "chatId": "Chat ID", + "chatIdPlaceholder": "e.g. 123456789", + "threadId": "Thread ID (optional)", + "threadIdPlaceholder": "Optional thread ID" + }, + "discord": { + "title": "Discord", + "description": "Send notifications via Discord webhook.", + "webhookUrl": "Webhook URL", + "webhookUrlPlaceholder": "https://discord.com/api/webhooks/..." + }, + "confirmo": { + "title": "Confirmo", + "description": "Send notifications via Confirmo hook (all events).", + "unavailable": "Confirmo hook not found: {path}" + }, + "commands": { + "title": "Hooks Commands", + "description": "Run a command for each event.", + "hint": "The payload is sent to stdin as JSON.", + "commandPlaceholder": "Command to run" + }, + "test": { + "button": "Test", + "testing": "Testing...", + "success": "Success", + "failed": "Failed", + "duration": "{ms} ms", + "statusCode": "HTTP {code}", + "exitCode": "Exit {code}", + "retryAfter": "Retry after {ms} ms", + "stdout": "stdout", + "stderr": "stderr" + } + }, "data": { "title": "Data Settings", "syncEnable": "Enable Data Sync", diff --git a/src/renderer/src/i18n/fa-IR/routes.json b/src/renderer/src/i18n/fa-IR/routes.json index c1dff647d..7a357ab11 100644 --- a/src/renderer/src/i18n/fa-IR/routes.json +++ b/src/renderer/src/i18n/fa-IR/routes.json @@ -14,5 +14,6 @@ "settings-prompt": "مدیریت پرامپت‌ها", "settings-mcp-market": "بازار MCP", "settings-acp": "نماینده ACP", - "settings-skills": "Skills" + "settings-skills": "Skills", + "settings-notifications-hooks": "اعلان‌ها و هوک‌ها" } diff --git a/src/renderer/src/i18n/fa-IR/settings.json b/src/renderer/src/i18n/fa-IR/settings.json index 8c276df34..d1dd42317 100644 --- a/src/renderer/src/i18n/fa-IR/settings.json +++ b/src/renderer/src/i18n/fa-IR/settings.json @@ -64,6 +64,60 @@ "fileMaxSize": "حداکثر اندازه فایل", "fileMaxSizeHint": "حداکثر اندازه یک فایل قابل آپلود را محدود می‌کند" }, + "notificationsHooks": { + "title": "اعلان‌ها و هوک‌ها", + "description": "پیکربندی اعلان‌های وب‌هوک و هوک‌های چرخهٔ عمر.", + "events": { + "title": "رویدادها", + "SessionStart": "شروع نشست", + "UserPromptSubmit": "ارسال پرامپت کاربر", + "PreToolUse": "پیش از استفاده از ابزار", + "PostToolUse": "پس از استفاده از ابزار", + "PostToolUseFailure": "شکست استفاده از ابزار", + "PermissionRequest": "درخواست اجازه", + "Stop": "توقف", + "SessionEnd": "پایان نشست" + }, + "telegram": { + "title": "Telegram", + "description": "ارسال اعلان‌ها از طریق ربات تلگرام.", + "botToken": "توکن ربات", + "botTokenPlaceholder": "توکن ربات تلگرام", + "chatId": "شناسهٔ گفتگو", + "chatIdPlaceholder": "مثلاً 123456789", + "threadId": "شناسهٔ رشته (اختیاری)", + "threadIdPlaceholder": "شناسهٔ رشتهٔ اختیاری" + }, + "discord": { + "title": "Discord", + "description": "ارسال اعلان‌ها از طریق وب‌هوک دیسکورد.", + "webhookUrl": "نشانی وب‌هوک", + "webhookUrlPlaceholder": "https://discord.com/api/webhooks/..." + }, + "confirmo": { + "title": "Confirmo", + "description": "ارسال اعلان‌ها از طریق هوک Confirmo (همهٔ رویدادها).", + "unavailable": "هوک Confirmo یافت نشد: {path}" + }, + "commands": { + "title": "فرمان‌های هوک", + "description": "برای هر رویداد یک فرمان اجرا شود.", + "hint": "محتوا به‌صورت JSON به stdin فرستاده می‌شود.", + "commandPlaceholder": "فرمان برای اجرا" + }, + "test": { + "button": "آزمون", + "testing": "در حال آزمون...", + "success": "موفق", + "failed": "ناموفق", + "duration": "{ms} ms", + "statusCode": "HTTP {code}", + "exitCode": "کد خروج {code}", + "retryAfter": "تلاش دوباره پس از {ms} ms", + "stdout": "stdout", + "stderr": "stderr" + } + }, "data": { "title": "تنظیمات داده", "syncEnable": "روشن کردن همگام‌سازی داده", diff --git a/src/renderer/src/i18n/fr-FR/routes.json b/src/renderer/src/i18n/fr-FR/routes.json index 44db0798e..bb8d802a1 100644 --- a/src/renderer/src/i18n/fr-FR/routes.json +++ b/src/renderer/src/i18n/fr-FR/routes.json @@ -14,5 +14,6 @@ "settings-prompt": "Gestion des Prompts", "settings-mcp-market": "Marché MCP", "settings-acp": "Agent ACP", - "settings-skills": "Skills" + "settings-skills": "Skills", + "settings-notifications-hooks": "Notifications et hooks" } diff --git a/src/renderer/src/i18n/fr-FR/settings.json b/src/renderer/src/i18n/fr-FR/settings.json index 5d48d640d..66fb8ea86 100644 --- a/src/renderer/src/i18n/fr-FR/settings.json +++ b/src/renderer/src/i18n/fr-FR/settings.json @@ -64,6 +64,60 @@ "fileMaxSize": "Taille maximale du fichier", "fileMaxSizeHint": "Limite la taille maximale d'un fichier à télécharger" }, + "notificationsHooks": { + "title": "Notifications et hooks", + "description": "Configurer les notifications webhook et les hooks du cycle de vie.", + "events": { + "title": "Événements", + "SessionStart": "Début de session", + "UserPromptSubmit": "Envoi du prompt utilisateur", + "PreToolUse": "Avant l’utilisation d’un outil", + "PostToolUse": "Après l’utilisation d’un outil", + "PostToolUseFailure": "Échec d’utilisation d’un outil", + "PermissionRequest": "Demande d’autorisation", + "Stop": "Arrêt", + "SessionEnd": "Fin de session" + }, + "telegram": { + "title": "Telegram", + "description": "Envoyer des notifications via un bot Telegram.", + "botToken": "Jeton du bot", + "botTokenPlaceholder": "Jeton du bot Telegram", + "chatId": "ID du chat", + "chatIdPlaceholder": "ex. 123456789", + "threadId": "ID du fil (optionnel)", + "threadIdPlaceholder": "ID du fil optionnel" + }, + "discord": { + "title": "Discord", + "description": "Envoyer des notifications via un webhook Discord.", + "webhookUrl": "URL du webhook", + "webhookUrlPlaceholder": "https://discord.com/api/webhooks/..." + }, + "confirmo": { + "title": "Confirmo", + "description": "Envoyer des notifications via le hook Confirmo (tous les événements).", + "unavailable": "Hook Confirmo introuvable : {path}" + }, + "commands": { + "title": "Commandes de hooks", + "description": "Exécuter une commande pour chaque événement.", + "hint": "La charge utile est envoyée sur stdin au format JSON.", + "commandPlaceholder": "Commande à exécuter" + }, + "test": { + "button": "Tester", + "testing": "Test en cours...", + "success": "Réussi", + "failed": "Échoué", + "duration": "{ms} ms", + "statusCode": "HTTP {code}", + "exitCode": "Code de sortie {code}", + "retryAfter": "Réessayer dans {ms} ms", + "stdout": "stdout", + "stderr": "stderr" + } + }, "data": { "title": "Paramètres des données", "syncEnable": "Activer la synchronisation des données", diff --git a/src/renderer/src/i18n/he-IL/routes.json b/src/renderer/src/i18n/he-IL/routes.json index 167fc7c6a..9e6190e39 100644 --- a/src/renderer/src/i18n/he-IL/routes.json +++ b/src/renderer/src/i18n/he-IL/routes.json @@ -14,5 +14,6 @@ "settings-prompt": "הנחיות (Prompts)", "settings-mcp-market": "חנות MCP", "settings-acp": "סוכני ACP", - "settings-skills": "Skills" + "settings-skills": "Skills", + "settings-notifications-hooks": "התראות ו‑Hooks" } diff --git a/src/renderer/src/i18n/he-IL/settings.json b/src/renderer/src/i18n/he-IL/settings.json index 4cbec87c3..a76e5da83 100644 --- a/src/renderer/src/i18n/he-IL/settings.json +++ b/src/renderer/src/i18n/he-IL/settings.json @@ -64,6 +64,60 @@ "fileMaxSize": "גודל קובץ מקסימלי", "fileMaxSizeHint": "מגביל את הגודל המקסימלי של קובץ בודד המועלה" }, + "notificationsHooks": { + "title": "התראות ו‑Hooks", + "description": "הגדרת התראות webhook ו‑hooks של מחזור החיים.", + "events": { + "title": "אירועים", + "SessionStart": "תחילת סשן", + "UserPromptSubmit": "שליחת פרומפט משתמש", + "PreToolUse": "לפני שימוש בכלי", + "PostToolUse": "אחרי שימוש בכלי", + "PostToolUseFailure": "כשל בשימוש בכלי", + "PermissionRequest": "בקשת הרשאה", + "Stop": "עצירה", + "SessionEnd": "סיום סשן" + }, + "telegram": { + "title": "Telegram", + "description": "שליחת התראות דרך בוט טלגרם.", + "botToken": "טוקן בוט", + "botTokenPlaceholder": "טוקן בוט טלגרם", + "chatId": "מזהה צ׳אט", + "chatIdPlaceholder": "למשל 123456789", + "threadId": "מזהה שרשור (אופציונלי)", + "threadIdPlaceholder": "מזהה שרשור אופציונלי" + }, + "discord": { + "title": "Discord", + "description": "שליחת התראות דרך webhook של Discord.", + "webhookUrl": "URL של Webhook", + "webhookUrlPlaceholder": "https://discord.com/api/webhooks/..." + }, + "confirmo": { + "title": "Confirmo", + "description": "שליחת התראות דרך hook של Confirmo (כל האירועים).", + "unavailable": "ה‑hook של Confirmo לא נמצא: {path}" + }, + "commands": { + "title": "פקודות Hooks", + "description": "הרצת פקודה עבור כל אירוע.", + "hint": "ה‑payload נשלח ל‑stdin כ‑JSON.", + "commandPlaceholder": "פקודה להרצה" + }, + "test": { + "button": "בדיקה", + "testing": "בבדיקה...", + "success": "הצלחה", + "failed": "נכשל", + "duration": "{ms} ms", + "statusCode": "HTTP {code}", + "exitCode": "קוד יציאה {code}", + "retryAfter": "נסה שוב בעוד {ms} ms", + "stdout": "stdout", + "stderr": "stderr" + } + }, "data": { "title": "הגדרות נתונים", "syncEnable": "הפעל סנכרון נתונים", diff --git a/src/renderer/src/i18n/ja-JP/routes.json b/src/renderer/src/i18n/ja-JP/routes.json index d538ffc04..5828db2be 100644 --- a/src/renderer/src/i18n/ja-JP/routes.json +++ b/src/renderer/src/i18n/ja-JP/routes.json @@ -14,5 +14,6 @@ "settings-prompt": "プロンプト管理", "settings-mcp-market": "MCP市場", "settings-acp": "ACPエージェント", - "settings-skills": "Skills" + "settings-skills": "Skills", + "settings-notifications-hooks": "通知とフック" } diff --git a/src/renderer/src/i18n/ja-JP/settings.json b/src/renderer/src/i18n/ja-JP/settings.json index b62b868e6..0c6f28626 100644 --- a/src/renderer/src/i18n/ja-JP/settings.json +++ b/src/renderer/src/i18n/ja-JP/settings.json @@ -64,6 +64,60 @@ "fileMaxSize": "ファイルの最大サイズ", "fileMaxSizeHint": "アップロードできるファイルの最大サイズを制限します" }, + "notificationsHooks": { + "title": "通知とフック", + "description": "Webhook 通知とライフサイクルフックを設定します。", + "events": { + "title": "イベント", + "SessionStart": "セッション開始", + "UserPromptSubmit": "ユーザープロンプト送信", + "PreToolUse": "ツール使用前", + "PostToolUse": "ツール使用後", + "PostToolUseFailure": "ツール使用失敗", + "PermissionRequest": "権限リクエスト", + "Stop": "停止", + "SessionEnd": "セッション終了" + }, + "telegram": { + "title": "Telegram", + "description": "Telegram ボットで通知を送信します。", + "botToken": "ボットトークン", + "botTokenPlaceholder": "Telegram ボットトークン", + "chatId": "チャット ID", + "chatIdPlaceholder": "例: 123456789", + "threadId": "スレッド ID(任意)", + "threadIdPlaceholder": "任意のスレッド ID" + }, + "discord": { + "title": "Discord", + "description": "Discord の Webhook で通知を送信します。", + "webhookUrl": "Webhook URL", + "webhookUrlPlaceholder": "https://discord.com/api/webhooks/..." + }, + "confirmo": { + "title": "Confirmo", + "description": "Confirmo フックで通知を送信します(全イベント)。", + "unavailable": "Confirmo フックが見つかりません: {path}" + }, + "commands": { + "title": "フックコマンド", + "description": "各イベントごとにコマンドを実行します。", + "hint": "ペイロードは JSON として stdin に送信されます。", + "commandPlaceholder": "実行するコマンド" + }, + "test": { + "button": "テスト", + "testing": "テスト中...", + "success": "成功", + "failed": "失敗", + "duration": "{ms} ms", + "statusCode": "HTTP {code}", + "exitCode": "終了コード {code}", + "retryAfter": "{ms} ms 後に再試行", + "stdout": "stdout", + "stderr": "stderr" + } + }, "data": { "title": "データ設定", "syncEnable": "データ同期を有効にする", diff --git a/src/renderer/src/i18n/ko-KR/routes.json b/src/renderer/src/i18n/ko-KR/routes.json index d295549d4..6a5477c96 100644 --- a/src/renderer/src/i18n/ko-KR/routes.json +++ b/src/renderer/src/i18n/ko-KR/routes.json @@ -14,5 +14,6 @@ "settings-prompt": "프롬프트 관리", "settings-mcp-market": "MCP 시장", "settings-acp": "ACP 프록시", - "settings-skills": "Skills" + "settings-skills": "Skills", + "settings-notifications-hooks": "알림 및 훅" } diff --git a/src/renderer/src/i18n/ko-KR/settings.json b/src/renderer/src/i18n/ko-KR/settings.json index 9cceae769..7bc58d0d1 100644 --- a/src/renderer/src/i18n/ko-KR/settings.json +++ b/src/renderer/src/i18n/ko-KR/settings.json @@ -64,6 +64,60 @@ "fileMaxSize": "파일 최대 크기", "fileMaxSizeHint": "단일 파일 업로드의 최대 크기를 제한합니다" }, + "notificationsHooks": { + "title": "알림 및 훅", + "description": "웹훅 알림과 라이프사이클 훅을 설정합니다.", + "events": { + "title": "이벤트", + "SessionStart": "세션 시작", + "UserPromptSubmit": "사용자 프롬프트 전송", + "PreToolUse": "도구 사용 전", + "PostToolUse": "도구 사용 후", + "PostToolUseFailure": "도구 사용 실패", + "PermissionRequest": "권한 요청", + "Stop": "중지", + "SessionEnd": "세션 종료" + }, + "telegram": { + "title": "Telegram", + "description": "Telegram 봇으로 알림을 전송합니다.", + "botToken": "봇 토큰", + "botTokenPlaceholder": "Telegram 봇 토큰", + "chatId": "채팅 ID", + "chatIdPlaceholder": "예: 123456789", + "threadId": "스레드 ID(선택 사항)", + "threadIdPlaceholder": "선택 사항 스레드 ID" + }, + "discord": { + "title": "Discord", + "description": "Discord 웹훅으로 알림을 전송합니다.", + "webhookUrl": "웹훅 URL", + "webhookUrlPlaceholder": "https://discord.com/api/webhooks/..." + }, + "confirmo": { + "title": "Confirmo", + "description": "Confirmo 훅으로 알림을 전송합니다(모든 이벤트).", + "unavailable": "Confirmo 훅을 찾을 수 없습니다: {path}" + }, + "commands": { + "title": "훅 명령", + "description": "각 이벤트마다 명령을 실행합니다.", + "hint": "페이로드가 JSON으로 stdin에 전송됩니다.", + "commandPlaceholder": "실행할 명령" + }, + "test": { + "button": "테스트", + "testing": "테스트 중...", + "success": "성공", + "failed": "실패", + "duration": "{ms} ms", + "statusCode": "HTTP {code}", + "exitCode": "종료 코드 {code}", + "retryAfter": "{ms} ms 후 재시도", + "stdout": "stdout", + "stderr": "stderr" + } + }, "data": { "title": "데이터 설정", "syncEnable": "데이터 동기화 활성화", diff --git a/src/renderer/src/i18n/pt-BR/routes.json b/src/renderer/src/i18n/pt-BR/routes.json index 8c0fbb7e8..762f4c572 100644 --- a/src/renderer/src/i18n/pt-BR/routes.json +++ b/src/renderer/src/i18n/pt-BR/routes.json @@ -14,5 +14,6 @@ "settings-prompt": "Prompts", "settings-mcp-market": "Mercado MCP", "settings-acp": "Proxy ACP", - "settings-skills": "Skills" + "settings-skills": "Skills", + "settings-notifications-hooks": "Notificações e hooks" } diff --git a/src/renderer/src/i18n/pt-BR/settings.json b/src/renderer/src/i18n/pt-BR/settings.json index 1fafdadc4..7a07896a6 100644 --- a/src/renderer/src/i18n/pt-BR/settings.json +++ b/src/renderer/src/i18n/pt-BR/settings.json @@ -64,6 +64,60 @@ "fileMaxSize": "Tamanho máximo do arquivo", "fileMaxSizeHint": "Limita o tamanho máximo de um arquivo enviado" }, + "notificationsHooks": { + "title": "Notificações e hooks", + "description": "Configure notificações de webhook e hooks de ciclo de vida.", + "events": { + "title": "Eventos", + "SessionStart": "Início da sessão", + "UserPromptSubmit": "Envio do prompt do usuário", + "PreToolUse": "Antes do uso da ferramenta", + "PostToolUse": "Após o uso da ferramenta", + "PostToolUseFailure": "Falha no uso da ferramenta", + "PermissionRequest": "Solicitação de permissão", + "Stop": "Parada", + "SessionEnd": "Fim da sessão" + }, + "telegram": { + "title": "Telegram", + "description": "Enviar notificações via bot do Telegram.", + "botToken": "Token do bot", + "botTokenPlaceholder": "Token do bot do Telegram", + "chatId": "ID do chat", + "chatIdPlaceholder": "ex.: 123456789", + "threadId": "ID da thread (opcional)", + "threadIdPlaceholder": "ID de thread opcional" + }, + "discord": { + "title": "Discord", + "description": "Enviar notificações via webhook do Discord.", + "webhookUrl": "URL do webhook", + "webhookUrlPlaceholder": "https://discord.com/api/webhooks/..." + }, + "confirmo": { + "title": "Confirmo", + "description": "Enviar notificações via hook Confirmo (todos os eventos).", + "unavailable": "Hook do Confirmo não encontrado: {path}" + }, + "commands": { + "title": "Comandos de hook", + "description": "Executar um comando para cada evento.", + "hint": "O payload é enviado para o stdin em JSON.", + "commandPlaceholder": "Comando a executar" + }, + "test": { + "button": "Testar", + "testing": "Testando...", + "success": "Sucesso", + "failed": "Falhou", + "duration": "{ms} ms", + "statusCode": "HTTP {code}", + "exitCode": "Código de saída {code}", + "retryAfter": "Tentar novamente em {ms} ms", + "stdout": "stdout", + "stderr": "stderr" + } + }, "data": { "title": "Configurações de Dados", "syncEnable": "Habilitar Sincronização de Dados", diff --git a/src/renderer/src/i18n/ru-RU/routes.json b/src/renderer/src/i18n/ru-RU/routes.json index a38507ed9..b10e02fd9 100644 --- a/src/renderer/src/i18n/ru-RU/routes.json +++ b/src/renderer/src/i18n/ru-RU/routes.json @@ -14,5 +14,6 @@ "settings-prompt": "Управление промптами", "settings-mcp-market": "MCP Market", "settings-acp": "ACP-агент", - "settings-skills": "Skills" + "settings-skills": "Skills", + "settings-notifications-hooks": "Уведомления и хуки" } diff --git a/src/renderer/src/i18n/ru-RU/settings.json b/src/renderer/src/i18n/ru-RU/settings.json index 6fff73006..1b89e2480 100644 --- a/src/renderer/src/i18n/ru-RU/settings.json +++ b/src/renderer/src/i18n/ru-RU/settings.json @@ -64,6 +64,60 @@ "fileMaxSize": "Максимальный размер файла", "fileMaxSizeHint": "Ограничивает максимальный размер загружаемого файла" }, + "notificationsHooks": { + "title": "Уведомления и хуки", + "description": "Настройте webhook-уведомления и хуки жизненного цикла.", + "events": { + "title": "События", + "SessionStart": "Начало сессии", + "UserPromptSubmit": "Отправка пользовательского промпта", + "PreToolUse": "Перед использованием инструмента", + "PostToolUse": "После использования инструмента", + "PostToolUseFailure": "Сбой использования инструмента", + "PermissionRequest": "Запрос разрешения", + "Stop": "Остановка", + "SessionEnd": "Конец сессии" + }, + "telegram": { + "title": "Telegram", + "description": "Отправлять уведомления через бота Telegram.", + "botToken": "Токен бота", + "botTokenPlaceholder": "Токен бота Telegram", + "chatId": "ID чата", + "chatIdPlaceholder": "например 123456789", + "threadId": "ID треда (необязательно)", + "threadIdPlaceholder": "Необязательный ID треда" + }, + "discord": { + "title": "Discord", + "description": "Отправлять уведомления через webhook Discord.", + "webhookUrl": "URL вебхука", + "webhookUrlPlaceholder": "https://discord.com/api/webhooks/..." + }, + "confirmo": { + "title": "Confirmo", + "description": "Отправлять уведомления через хук Confirmo (все события).", + "unavailable": "Хук Confirmo не найден: {path}" + }, + "commands": { + "title": "Команды хуков", + "description": "Выполнять команду для каждого события.", + "hint": "Пейлоад отправляется в stdin в формате JSON.", + "commandPlaceholder": "Команда для запуска" + }, + "test": { + "button": "Тест", + "testing": "Тестирование...", + "success": "Успех", + "failed": "Ошибка", + "duration": "{ms} мс", + "statusCode": "HTTP {code}", + "exitCode": "Код выхода {code}", + "retryAfter": "Повторить через {ms} мс", + "stdout": "stdout", + "stderr": "stderr" + } + }, "data": { "title": "Настройки данных", "syncEnable": "Включить синхронизацию данных", diff --git a/src/renderer/src/i18n/zh-CN/routes.json b/src/renderer/src/i18n/zh-CN/routes.json index f16824bec..b7fe8c6b9 100644 --- a/src/renderer/src/i18n/zh-CN/routes.json +++ b/src/renderer/src/i18n/zh-CN/routes.json @@ -14,5 +14,6 @@ "settings-prompt": "Prompt管理", "settings-mcp-market": "MCP市场", "settings-acp": "ACP Agent", - "settings-skills": "skills设置" + "settings-skills": "skills设置", + "settings-notifications-hooks": "通知与Hooks" } diff --git a/src/renderer/src/i18n/zh-CN/settings.json b/src/renderer/src/i18n/zh-CN/settings.json index f763b2742..c33f419ed 100644 --- a/src/renderer/src/i18n/zh-CN/settings.json +++ b/src/renderer/src/i18n/zh-CN/settings.json @@ -64,6 +64,60 @@ "fileMaxSize": "文件最大大小", "fileMaxSizeHint": "限制单个文件的最大上传大小" }, + "notificationsHooks": { + "title": "通知与Hooks", + "description": "配置 webhook 通知与生命周期 hooks。", + "events": { + "title": "事件", + "SessionStart": "会话开始", + "UserPromptSubmit": "用户提交", + "PreToolUse": "工具调用前", + "PostToolUse": "工具调用后", + "PostToolUseFailure": "工具调用失败", + "PermissionRequest": "权限请求", + "Stop": "停止", + "SessionEnd": "会话结束" + }, + "telegram": { + "title": "Telegram", + "description": "通过 Telegram Bot 发送通知。", + "botToken": "Bot Token", + "botTokenPlaceholder": "Telegram Bot Token", + "chatId": "Chat ID", + "chatIdPlaceholder": "例如 123456789", + "threadId": "Thread ID(可选)", + "threadIdPlaceholder": "可选 Thread ID" + }, + "discord": { + "title": "Discord", + "description": "通过 Discord webhook 发送通知。", + "webhookUrl": "Webhook URL", + "webhookUrlPlaceholder": "https://discord.com/api/webhooks/..." + }, + "confirmo": { + "title": "Confirmo", + "description": "通过 Confirmo Hook 发送通知(默认发送全部事件)。", + "unavailable": "未找到 Confirmo Hook:{path}" + }, + "commands": { + "title": "Hooks Commands", + "description": "为每个事件执行命令。", + "hint": "payload 以 JSON 写入 stdin。", + "commandPlaceholder": "要执行的命令" + }, + "test": { + "button": "测试", + "testing": "测试中...", + "success": "成功", + "failed": "失败", + "duration": "{ms} ms", + "statusCode": "HTTP {code}", + "exitCode": "退出码 {code}", + "retryAfter": "重试等待 {ms} ms", + "stdout": "stdout", + "stderr": "stderr" + } + }, "data": { "title": "数据设置", "syncEnable": "启用数据同步", diff --git a/src/renderer/src/i18n/zh-HK/routes.json b/src/renderer/src/i18n/zh-HK/routes.json index f6536be63..1281f5f92 100644 --- a/src/renderer/src/i18n/zh-HK/routes.json +++ b/src/renderer/src/i18n/zh-HK/routes.json @@ -14,5 +14,6 @@ "settings-mcp-market": "MCP市場", "playground": "Playground 實驗室", "settings-acp": "ACP Agent", - "settings-skills": "skills設置" + "settings-skills": "skills設置", + "settings-notifications-hooks": "通知與 Hooks" } diff --git a/src/renderer/src/i18n/zh-HK/settings.json b/src/renderer/src/i18n/zh-HK/settings.json index 046b7f0f5..ec2bfd1da 100644 --- a/src/renderer/src/i18n/zh-HK/settings.json +++ b/src/renderer/src/i18n/zh-HK/settings.json @@ -64,6 +64,60 @@ "fileMaxSize": "檔案最大大小", "fileMaxSizeHint": "限制單個檔案的最大上傳大小" }, + "notificationsHooks": { + "title": "通知與 Hooks", + "description": "配置 webhook 通知與生命週期 Hooks。", + "events": { + "title": "事件", + "SessionStart": "會話開始", + "UserPromptSubmit": "使用者提示送出", + "PreToolUse": "使用工具前", + "PostToolUse": "使用工具後", + "PostToolUseFailure": "工具使用失敗", + "PermissionRequest": "權限請求", + "Stop": "停止", + "SessionEnd": "會話結束" + }, + "telegram": { + "title": "Telegram", + "description": "透過 Telegram 機器人發送通知。", + "botToken": "機器人 Token", + "botTokenPlaceholder": "Telegram 機器人 Token", + "chatId": "聊天 ID", + "chatIdPlaceholder": "例如 123456789", + "threadId": "主題 ID(可選)", + "threadIdPlaceholder": "可選的主題 ID" + }, + "discord": { + "title": "Discord", + "description": "透過 Discord webhook 發送通知。", + "webhookUrl": "Webhook URL", + "webhookUrlPlaceholder": "https://discord.com/api/webhooks/..." + }, + "confirmo": { + "title": "Confirmo", + "description": "透過 Confirmo hook 發送通知(所有事件)。", + "unavailable": "找不到 Confirmo hook:{path}" + }, + "commands": { + "title": "Hooks 指令", + "description": "每個事件執行一個指令。", + "hint": "Payload 會以 JSON 傳送到 stdin。", + "commandPlaceholder": "要執行的指令" + }, + "test": { + "button": "測試", + "testing": "測試中...", + "success": "成功", + "failed": "失敗", + "duration": "{ms} ms", + "statusCode": "HTTP {code}", + "exitCode": "退出碼 {code}", + "retryAfter": "在 {ms} ms 後重試", + "stdout": "stdout", + "stderr": "stderr" + } + }, "data": { "title": "數據設置", "syncEnable": "啟用數據同步", diff --git a/src/renderer/src/i18n/zh-TW/routes.json b/src/renderer/src/i18n/zh-TW/routes.json index b623b87b1..54762fc6d 100644 --- a/src/renderer/src/i18n/zh-TW/routes.json +++ b/src/renderer/src/i18n/zh-TW/routes.json @@ -14,5 +14,6 @@ "settings-mcp-market": "MCP市場", "playground": "Playground 實驗室", "settings-acp": "ACP Agent", - "settings-skills": "skills管理" + "settings-skills": "skills管理", + "settings-notifications-hooks": "通知與 Hooks" } diff --git a/src/renderer/src/i18n/zh-TW/settings.json b/src/renderer/src/i18n/zh-TW/settings.json index 467548701..4217824cf 100644 --- a/src/renderer/src/i18n/zh-TW/settings.json +++ b/src/renderer/src/i18n/zh-TW/settings.json @@ -64,6 +64,60 @@ "fileMaxSize": "檔案最大大小", "fileMaxSizeHint": "限制單個檔案的最大上傳大小" }, + "notificationsHooks": { + "title": "通知與 Hooks", + "description": "設定 webhook 通知與生命週期 Hooks。", + "events": { + "title": "事件", + "SessionStart": "會話開始", + "UserPromptSubmit": "使用者提示送出", + "PreToolUse": "使用工具前", + "PostToolUse": "使用工具後", + "PostToolUseFailure": "工具使用失敗", + "PermissionRequest": "權限請求", + "Stop": "停止", + "SessionEnd": "會話結束" + }, + "telegram": { + "title": "Telegram", + "description": "透過 Telegram 機器人發送通知。", + "botToken": "機器人 Token", + "botTokenPlaceholder": "Telegram 機器人 Token", + "chatId": "聊天 ID", + "chatIdPlaceholder": "例如 123456789", + "threadId": "主題 ID(選填)", + "threadIdPlaceholder": "選填主題 ID" + }, + "discord": { + "title": "Discord", + "description": "透過 Discord webhook 發送通知。", + "webhookUrl": "Webhook URL", + "webhookUrlPlaceholder": "https://discord.com/api/webhooks/..." + }, + "confirmo": { + "title": "Confirmo", + "description": "透過 Confirmo hook 發送通知(所有事件)。", + "unavailable": "找不到 Confirmo hook:{path}" + }, + "commands": { + "title": "Hooks 指令", + "description": "每個事件執行一個指令。", + "hint": "Payload 會以 JSON 傳送到 stdin。", + "commandPlaceholder": "要執行的指令" + }, + "test": { + "button": "測試", + "testing": "測試中...", + "success": "成功", + "failed": "失敗", + "duration": "{ms} ms", + "statusCode": "HTTP {code}", + "exitCode": "退出碼 {code}", + "retryAfter": "在 {ms} ms 後重試", + "stdout": "stdout", + "stderr": "stderr" + } + }, "data": { "title": "資料設定", "syncEnable": "啟用資料同步", diff --git a/src/shared/hooksNotifications.ts b/src/shared/hooksNotifications.ts new file mode 100644 index 000000000..6e1ccb2e6 --- /dev/null +++ b/src/shared/hooksNotifications.ts @@ -0,0 +1,111 @@ +export const HOOK_EVENT_NAMES = [ + 'SessionStart', + 'UserPromptSubmit', + 'PreToolUse', + 'PostToolUse', + 'PostToolUseFailure', + 'PermissionRequest', + 'Stop', + 'SessionEnd' +] as const + +export type HookEventName = (typeof HOOK_EVENT_NAMES)[number] + +export const DEFAULT_IMPORTANT_HOOK_EVENTS: HookEventName[] = [ + 'SessionStart', + 'SessionEnd', + 'PostToolUseFailure', + 'PermissionRequest', + 'Stop' +] + +export type HookChannel = 'telegram' | 'discord' | 'confirmo' | 'command' + +export interface HookCommandConfig { + enabled: boolean + command: string +} + +export interface HookCommandsConfig { + enabled: boolean + events: Record +} + +export interface TelegramNotificationsConfig { + enabled: boolean + botToken: string + chatId: string + threadId?: string + events: HookEventName[] +} + +export interface DiscordNotificationsConfig { + enabled: boolean + webhookUrl: string + events: HookEventName[] +} + +export interface ConfirmoNotificationsConfig { + enabled: boolean + events: HookEventName[] +} + +export interface HooksNotificationsSettings { + telegram: TelegramNotificationsConfig + discord: DiscordNotificationsConfig + confirmo: ConfirmoNotificationsConfig + commands: HookCommandsConfig +} + +export interface HookEventPayload { + payloadVersion: 1 + event: HookEventName + time: string + isTest: boolean + app: { + version: string + platform: string + } + session: { + conversationId?: string + agentId?: string | null + workdir?: string | null + providerId?: string + modelId?: string + } + user?: { + messageId?: string + promptPreview?: string + } | null + tool?: { + callId?: string + name?: string + paramsPreview?: string + responsePreview?: string + error?: string + } | null + permission?: Record | null + stop?: { + reason?: string + userStop?: boolean + } | null + usage?: Record | null + error?: { + message?: string + stack?: string + } | null +} + +export interface HookCommandResult { + success: boolean + durationMs: number + exitCode?: number | null + stdout?: string + stderr?: string + error?: string +} + +export interface HookTestResult extends HookCommandResult { + statusCode?: number + retryAfterMs?: number +} diff --git a/src/shared/types/index.d.ts b/src/shared/types/index.d.ts index 60c03707e..6753f62ae 100644 --- a/src/shared/types/index.d.ts +++ b/src/shared/types/index.d.ts @@ -4,6 +4,7 @@ export type * from './presenters/legacy.presenters' export type * from './presenters/agent-provider' export type * from './presenters/workspace' export type * from './presenters/tool.presenter' +export type * from '../hooksNotifications' export * from './browser' export * from './chatSettings' export * from './skill' diff --git a/src/shared/types/presenters/legacy.presenters.d.ts b/src/shared/types/presenters/legacy.presenters.d.ts index 0ee90004e..a3e0940c9 100644 --- a/src/shared/types/presenters/legacy.presenters.d.ts +++ b/src/shared/types/presenters/legacy.presenters.d.ts @@ -4,6 +4,11 @@ import { MessageFile } from './chat' import { ShowResponse } from 'ollama' import { ShortcutKeySetting } from '@/presenter/configPresenter/shortcutKeySettings' import { ApiEndpointType, ModelType } from '@shared/model' +import type { + HookEventName, + HookTestResult, + HooksNotificationsSettings +} from '../../hooksNotifications' import type { NowledgeMemThread, NowledgeMemExportSummary } from '../nowledgeMem' import { ProviderChange, ProviderBatchUpdate } from './provider-operations' import type { AgentSessionLifecycleStatus } from './agent-provider' @@ -560,6 +565,14 @@ export interface IConfigPresenter { setSyncFolderPath(folderPath: string): void getLastSyncTime(): number setLastSyncTime(time: number): void + // Hooks & notifications settings + getHooksNotificationsConfig(): HooksNotificationsSettings + setHooksNotificationsConfig(config: HooksNotificationsSettings): HooksNotificationsSettings + getConfirmoHookStatus(): { available: boolean; path: string } + testTelegramNotification(): Promise + testDiscordNotification(): Promise + testConfirmoNotification(): Promise + testHookCommand(eventName: HookEventName): Promise // Skills settings getSkillsEnabled(): boolean setSkillsEnabled(enabled: boolean): void diff --git a/test/main/presenter/hooksNotifications.test.ts b/test/main/presenter/hooksNotifications.test.ts new file mode 100644 index 000000000..59b34c53a --- /dev/null +++ b/test/main/presenter/hooksNotifications.test.ts @@ -0,0 +1,102 @@ +import { describe, it, expect, vi } from 'vitest' +import { truncateText, parseRetryAfterMs } from '../../../src/main/presenter/hooksNotifications' +import { + normalizeHooksNotificationsConfig, + createDefaultHooksNotificationsConfig +} from '../../../src/main/presenter/hooksNotifications/config' +import { + DEFAULT_IMPORTANT_HOOK_EVENTS, + HOOK_EVENT_NAMES +} from '../../../src/shared/hooksNotifications' + +vi.mock('electron-log', () => ({ + default: { + warn: vi.fn(), + info: vi.fn(), + error: vi.fn() + } +})) + +describe('hooksNotifications', () => { + it('truncateText keeps short strings intact', () => { + expect(truncateText('hello', 10)).toBe('hello') + }) + + it('truncateText truncates with suffix', () => { + const result = truncateText('abcdefghijklmnopqrstuvwxyz', 20) + expect(result.endsWith(' ...(truncated)')).toBe(true) + expect(result.length).toBe(20) + }) + + it('parseRetryAfterMs reads seconds header', () => { + const response = new Response(null, { + status: 429, + headers: { 'retry-after': '2' } + }) + expect(parseRetryAfterMs(response)).toBe(2000) + }) + + it('parseRetryAfterMs reads ms header', () => { + const response = new Response(null, { + status: 429, + headers: { 'retry-after': '1200' } + }) + expect(parseRetryAfterMs(response)).toBe(1200) + }) + + it('parseRetryAfterMs reads retry_after from body', () => { + const response = new Response(null, { status: 429 }) + expect(parseRetryAfterMs(response, { retry_after: 3 })).toBe(3000) + }) + + it('normalizeHooksNotificationsConfig sanitizes events and commands', () => { + const input = { + telegram: { + enabled: true, + botToken: 'token', + chatId: 'chat', + events: ['SessionStart', 'UnknownEvent'] + }, + discord: { + enabled: true, + events: [] + }, + confirmo: { + enabled: true, + events: ['Stop', 'UnknownEvent'] + }, + commands: { + enabled: true, + events: { + SessionStart: { enabled: true, command: 'echo ok' }, + UnknownEvent: { enabled: true, command: 'bad' } + } + }, + extra: 'ignored' + } + + const normalized = normalizeHooksNotificationsConfig(input) + + expect(normalized.telegram.enabled).toBe(true) + expect(normalized.telegram.botToken).toBe('token') + expect(normalized.telegram.chatId).toBe('chat') + expect(normalized.telegram.events).toEqual(['SessionStart']) + + expect(normalized.discord.enabled).toBe(true) + expect(normalized.discord.events).toEqual(DEFAULT_IMPORTANT_HOOK_EVENTS) + + expect(normalized.confirmo.enabled).toBe(true) + expect(normalized.confirmo.events).toEqual([...HOOK_EVENT_NAMES]) + + expect(Object.keys(normalized.commands.events)).toEqual([...HOOK_EVENT_NAMES]) + expect(normalized.commands.events.SessionStart.enabled).toBe(true) + expect(normalized.commands.events.SessionStart.command).toBe('echo ok') + }) + + it('normalizeHooksNotificationsConfig falls back to defaults', () => { + const defaults = createDefaultHooksNotificationsConfig() + const normalized = normalizeHooksNotificationsConfig(null) + + expect(normalized).toEqual(defaults) + }) +}) From 347e95db131d13d6ecbb62be6931c0c69f1ce485 Mon Sep 17 00:00:00 2001 From: zerob13 Date: Mon, 9 Feb 2026 20:55:20 +0800 Subject: [PATCH 4/4] chore: update 0.5.8 --- CHANGELOG.md | 7 + package.json | 2 +- resources/model-db/providers.json | 266 +++++++++++++++++++++--------- 3 files changed, 195 insertions(+), 80 deletions(-) diff --git a/CHANGELOG.md b/CHANGELOG.md index c00f3792e..8e6595866 100644 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -1,4 +1,11 @@ # Changelog + +## v0.5.8 (2026-02-09) +- OpenAI 默认改为 Responses API +- 支持了 Telegram/Discord/Confirmo 通知 +- 支持任务生命周期 hooks +- 修复少量 Bug + ## v0.5.7 (2026-02-05) - 完善 Skills 支持 - Agent 现在可以生成可交互的提问信息 diff --git a/package.json b/package.json index 8a34cc198..9dda2974d 100644 --- a/package.json +++ b/package.json @@ -1,6 +1,6 @@ { "name": "DeepChat", - "version": "0.5.7", + "version": "0.5.8", "description": "DeepChat,一个简单易用的 Agent 客户端", "main": "./out/main/index.js", "author": "ThinkInAIXYZ", diff --git a/resources/model-db/providers.json b/resources/model-db/providers.json index 08c353c85..e2b181caf 100644 --- a/resources/model-db/providers.json +++ b/resources/model-db/providers.json @@ -51993,8 +51993,7 @@ "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, @@ -52812,7 +52811,7 @@ "context": 400000, "output": 64000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -53053,7 +53052,7 @@ "context": 400000, "output": 64000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -53916,6 +53915,41 @@ "cache_write": 3.75 } }, + { + "id": "anthropic/claude-opus-4.6", + "name": "Claude Opus 4.6", + "display_name": "Claude Opus 4.6", + "modalities": { + "input": [ + "image", + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1000000, + "output": 128000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01-01", + "release_date": "2026-02-06", + "last_updated": "2026-02-06", + "cost": { + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 + } + }, { "id": "deepseek/deepseek-chat-v3.1", "name": "DeepSeek: DeepSeek V3.1", @@ -56426,6 +56460,40 @@ "output": 2 } }, + { + "id": "moonshotai/Kimi-K2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", + "modalities": { + "input": [ + "text", + "image", + "video" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 32768 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-01-27", + "last_updated": "2026-01-27", + "cost": { + "input": 0.5, + "output": 2.8 + } + }, { "id": "moonshotai/Kimi-K2-Thinking", "name": "Kimi K2 Thinking", @@ -60682,7 +60750,7 @@ ] }, "limit": { - "context": 1000000, + "context": 200000, "output": 128000 }, "temperature": true, @@ -61426,6 +61494,42 @@ "output": 0 } }, + { + "id": "duo-chat-opus-4-6", + "name": "Agentic Chat (Claude Opus 4.6)", + "display_name": "Agentic Chat (Claude Opus 4.6)", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 200000, + "output": 64000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", + "cost": { + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 + } + }, { "id": "duo-chat-gpt-5-2", "name": "Agentic Chat (GPT-5.2)", @@ -78265,6 +78369,31 @@ "open_weights": true, "release_date": "2025-06-15", "last_updated": "2026-01-19" + }, + { + "id": "qwen3-coder-next", + "name": "qwen3-coder-next", + "display_name": "qwen3-coder-next", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 65536 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2026-02-02", + "last_updated": "2026-02-08" } ] }, @@ -98868,28 +98997,6 @@ }, "type": "chat" }, - { - "id": "ai21/jamba-mini-1.7", - "name": "AI21: Jamba Mini 1.7", - "display_name": "AI21: Jamba Mini 1.7", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 256000, - "output": 4096 - }, - "tool_call": true, - "reasoning": { - "supported": false - }, - "type": "chat" - }, { "id": "aion-labs/aion-1.0", "name": "AionLabs: Aion-1.0", @@ -102372,7 +102479,7 @@ }, "limit": { "context": 32768, - "output": 32768 + "output": 16384 }, "temperature": true, "tool_call": true, @@ -102616,29 +102723,6 @@ "supported": false } }, - { - "id": "moonshotai/kimi-dev-72b", - "name": "MoonshotAI: Kimi Dev 72B", - "display_name": "MoonshotAI: Kimi Dev 72B", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 131072, - "output": 131072 - }, - "tool_call": false, - "reasoning": { - "supported": true, - "default": true - }, - "type": "chat" - }, { "id": "moonshotai/kimi-k2", "name": "MoonshotAI: Kimi K2 0711", @@ -102743,7 +102827,7 @@ }, "limit": { "context": 262144, - "output": 65535 + "output": 262144 }, "tool_call": true, "reasoning": { @@ -104717,6 +104801,30 @@ }, "type": "imageGeneration" }, + { + "id": "openrouter/pony-alpha", + "name": "Pony Alpha", + "display_name": "Pony Alpha", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 200000, + "output": 131000 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": true, + "default": true + }, + "type": "chat" + }, { "id": "perplexity/sonar", "name": "Perplexity: Sonar", @@ -106016,30 +106124,6 @@ }, "type": "chat" }, - { - "id": "stepfun-ai/step3", - "name": "StepFun: Step3", - "display_name": "StepFun: Step3", - "modalities": { - "input": [ - "image", - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 65536, - "output": 65536 - }, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "type": "imageGeneration" - }, { "id": "stepfun/step-3.5-flash:free", "name": "StepFun: Step 3.5 Flash (free)", @@ -106672,7 +106756,7 @@ }, "limit": { "context": 131072, - "output": 131072 + "output": 98304 }, "temperature": true, "tool_call": true, @@ -106842,8 +106926,8 @@ ] }, "limit": { - "context": 200000, - "output": 131072 + "context": 202752, + "output": 202752 }, "temperature": true, "tool_call": true, @@ -107044,6 +107128,30 @@ }, "type": "chat" }, + { + "id": "claude-opus-4-6", + "name": "claude-opus-4-6", + "display_name": "claude-opus-4-6", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1000000, + "output": 128000 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "type": "chat" + }, { "id": "claude-sonnet-4-20250514", "name": "claude-sonnet-4-20250514",